Apache POI使用

使用 Apache POI 解析 Excel 文件：

package excellucene;

import java.io.File;

import java.io.FileInputStream;

import java.io.FileNotFoundException;

import java.io.FileWriter;

import java.io.FilenameFilter;

import java.io.IOException;

import java.io.InputStream;

import java.io.PrintWriter;

import org.apache.poi.EncryptedDocumentException;

import org.apache.poi.hssf.extractor.ExcelExtractor;

import org.apache.poi.hssf.usermodel.HSSFWorkbook;

import org.apache.poi.ss.usermodel.Cell;

import org.apache.poi.ss.usermodel.Row;

import org.apache.poi.ss.usermodel.Sheet;

import org.apache.poi.ss.usermodel.Workbook;

import org.apache.poi.ss.usermodel.WorkbookFactory;

import com.sun.media.sound.InvalidFormatException;

/**
 * Scans a directory for Excel workbooks ({@code .xls} / {@code .xlsx}) and dumps
 * every cell of each workbook's first sheet to the console and to a text file.
 *
 * <p>Written against the Apache POI 3.x API (int-based {@code Cell.CELL_TYPE_*}
 * constants, {@code WorkbookFactory.create} declaring {@code InvalidFormatException}).
 *
 * <p>Note: this class no longer references {@code com.sun.media.sound.InvalidFormatException};
 * that JDK-internal type is an {@link IOException} subclass and is covered by the
 * {@code IOException} handler.
 */
public class ParseExcel {

    /** Directory scanned when no command-line argument is supplied. */
    private static final String DEFAULT_DIR = "C:\\Users\\Desktop\\a01hos\\img";

    /** Text file that {@link #save(String)} appends to (relative to the working directory). */
    private static final String OUTPUT_FILE = "file/haha.txt";

    /**
     * Lists the Excel files in a directory and parses each of them.
     *
     * @param args optional; {@code args[0]} is the directory to scan. When absent the
     *             built-in default directory is used.
     * @throws IOException if a canonical path cannot be resolved
     */
    public static void main(String[] args) throws IOException {
        String path = args.length > 0 ? args[0] : DEFAULT_DIR;
        File f = new File(path);

        // listFiles() returns null (not an empty array) when the path is missing,
        // is not a directory, or cannot be read.
        File[] files = f.listFiles();
        if (files == null) {
            System.err.println("Not a readable directory: " + path);
            return;
        }
        System.out.println(files.length);

        File[] filesxls = f.listFiles(new FilenameFilter() {
            @Override
            public boolean accept(File dir, String name) {
                return name.endsWith(".xls") || name.endsWith(".xlsx");
            }
        });
        if (filesxls == null) {
            System.err.println("Not a readable directory: " + path);
            return;
        }
        System.out.println("Excel文件有： " + filesxls.length);

        ParseExcel parser = new ParseExcel();
        for (File f2 : filesxls) {
            String fileDirectPathName = f2.getCanonicalPath();
            System.out.println(fileDirectPathName);
            // System.out.println("文件名： " + f2.getName());
            parser.parseXml(fileDirectPathName);
        }

        /*
         * Disabled: builds a Lucene index over the workbooks found above.
         *
         * IndexWriter writer; // create the Lucene IndexWriter
         * Directory dir = FSDirectory.open(Paths.get("f:/excelindex"));
         * writer = new IndexWriter(dir, new IndexWriterConfig(new StandardAnalyzer()));
         *
         * for (File f2 : filesxls) {
         *     // FileReader fr = new FileReader(f);
         *     // BufferedReader br = new BufferedReader(fr);
         *     System.out.println(f2.getCanonicalPath());
         *     System.out.println("文件名： " + f2.getName());
         *
         *     // create the document object and add it to the index
         *     Document document = new Document();
         *
         *     Document doc = new Document();
         *     doc.add(new Field("contents", ExcelFileReader(f2.getCanonicalPath()),
         *             TextField.TYPE_NOT_STORED));
         *     doc.add(new Field("filename", f2.getName(), TextField.TYPE_STORED));
         *     doc.add(new StringField("fullpath", f2.getCanonicalPath(), Field.Store.YES));
         *
         *     writer.addDocument(doc);
         *
         *     writer.numDocs();
         * }
         */
    }

    /**
     * Extracts the text of a workbook using POI's {@code ExcelExtractor}.
     *
     * <p>The workbook is opened with {@code HSSFWorkbook}, POI's implementation for the
     * binary {@code .xls} format. Formulas are emitted instead of their results and
     * sheet names are omitted.
     *
     * @param fileName path of the workbook to read
     * @return the extracted text
     * @throws IOException if the file cannot be opened or read
     */
    public static String ExcelFileReader(String fileName) throws IOException {
        // try-with-resources: the original never closed this stream.
        try (InputStream in = new FileInputStream(fileName)) {
            HSSFWorkbook wb = new HSSFWorkbook(in);
            ExcelExtractor extractor = new ExcelExtractor(wb);
            extractor.setFormulasNotResults(true);
            extractor.setIncludeSheetNames(false);
            return extractor.getText();
        }
    }

    /**
     * Prints every cell of the first sheet, each followed by {@code "---"}, and appends
     * the same text to the output file via {@link #save(String)}. A line break is
     * printed to the console after each row.
     *
     * <p>Failures are reported with a stack trace and otherwise ignored, so one bad
     * workbook does not abort a batch run.
     *
     * @param filename path of the workbook to parse
     */
    public void parseXml(String filename) {
        // The workbook is loaded through a stream that this method closes, so the
        // file handle is released as soon as parsing ends (the original opened the
        // workbook from a File and never closed it).
        try (InputStream in = new FileInputStream(filename)) {
            Workbook wb = WorkbookFactory.create(in);
            Sheet sheet = wb.getSheetAt(0);
            for (Row row : sheet) {
                for (Cell cell : row) {
                    // Evaluate the cell once and reuse the text for both sinks.
                    String text = getCellValue(cell) + "---";
                    System.out.print(text);
                    save(text);
                }
                System.out.println();
            }
        } catch (EncryptedDocumentException | IOException
                | org.apache.poi.openxml4j.exceptions.InvalidFormatException e) {
            e.printStackTrace();
        }
    }

    /**
     * Converts a cell to its textual form.
     *
     * @param cell the cell to read
     * @return the boolean, error code, formula text, numeric value or string content
     *         as a {@code String}; {@code null} for blank cells and unknown cell types
     */
    public Object getCellValue(Cell cell) {
        switch (cell.getCellType()) {
        case Cell.CELL_TYPE_BOOLEAN:
            return String.valueOf(cell.getBooleanCellValue());
        case Cell.CELL_TYPE_ERROR:
            return String.valueOf(cell.getErrorCellValue());
        case Cell.CELL_TYPE_FORMULA:
            // The formula text itself, not its evaluated result.
            return cell.getCellFormula();
        case Cell.CELL_TYPE_NUMERIC:
            return String.valueOf(cell.getNumericCellValue());
        case Cell.CELL_TYPE_STRING:
            return cell.getStringCellValue();
        case Cell.CELL_TYPE_BLANK:
        default:
            return null;
        }
    }

    /**
     * Appends a string as one line to the output text file, creating the file and its
     * parent directory when they do not exist yet.
     *
     * @param str the text to append
     * @return {@code true} if the line was written, {@code false} on any I/O failure
     */
    public boolean save(String str) {
        File target = new File(OUTPUT_FILE);

        // FileWriter creates the file itself but not its directory.
        File parent = target.getParentFile();
        if (parent != null && !parent.mkdirs() && !parent.isDirectory()) {
            System.err.println("Cannot create directory: " + parent);
            return false;
        }

        // Append mode; closing the PrintWriter also closes the underlying FileWriter.
        try (PrintWriter out = new PrintWriter(new FileWriter(target, true))) {
            out.println(str);
            // PrintWriter swallows IOExceptions; checkError() flushes and reports them.
            return !out.checkError();
        } catch (IOException e) {
            e.printStackTrace();
            return false;
        }
    }

}

使用 Lucene 检索索引：

package excellucene;

import java.io.IOException;

import java.nio.file.Paths;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.index.DirectoryReader;

import org.apache.lucene.index.IndexReader;

import org.apache.lucene.queryparser.classic.ParseException;

import org.apache.lucene.queryparser.classic.QueryParser;

import org.apache.lucene.search.IndexSearcher;

import org.apache.lucene.search.Query;

import org.apache.lucene.search.ScoreDoc;

import org.apache.lucene.search.TopDocs;

import org.apache.lucene.store.FSDirectory;

/**
 * Command-line search over a Lucene index whose documents carry a {@code filename}
 * field (searched) and a {@code fullpath} field (printed for every hit).
 */
public class SearchExcel {

    /** Index directory used when no arguments are supplied. */
    private static final String DEFAULT_INDEX_DIR = "F:\\excelindex";

    /** Query string used when no arguments are supplied. */
    private static final String DEFAULT_QUERY = "zhangxing";

    /**
     * Runs a search.
     *
     * @param args either empty (built-in index directory and query are used) or exactly
     *             two values: the index directory and the query string
     * @throws IllegalArgumentException if any other number of arguments is given
     * @throws IOException if the index cannot be opened or read
     * @throws ParseException if the query string cannot be parsed
     */
    public static void main(String[] args) throws IOException, ParseException {
        if (args.length != 0 && args.length != 2) {
            throw new IllegalArgumentException(
                    "Usage: java " + SearchExcel.class.getName() + " <index dir> <query>");
        }

        // The original required two arguments and then ignored them.
        String indexDir = args.length == 2 ? args[0] : DEFAULT_INDEX_DIR;
        String q = args.length == 2 ? args[1] : DEFAULT_QUERY;

        search(indexDir, q);
    }

    /**
     * Searches the {@code filename} field of the index for {@code q}, reports the hit
     * count and search time on standard error, and prints the {@code fullpath} of the
     * top 10 hits on standard output.
     *
     * @param indexDir directory containing the Lucene index
     * @param q query string in Lucene's classic query syntax
     * @throws IOException if the index cannot be opened or read
     * @throws ParseException if {@code q} cannot be parsed
     */
    public static void search(String indexDir, String q) throws IOException, ParseException {
        // Directory, reader and analyzer are all Closeable; the original leaked them.
        try (FSDirectory dir = FSDirectory.open(Paths.get(indexDir));
                IndexReader reader = DirectoryReader.open(dir);
                Analyzer analyzer = new StandardAnalyzer()) {
            IndexSearcher is = new IndexSearcher(reader);

            // QueryParser ships in a separate jar (lucene-queryparser-7.4.0.jar) that
            // must be on the classpath.
            QueryParser parser = new QueryParser("filename", analyzer);
            Query query = parser.parse(q);

            long start = System.currentTimeMillis();
            TopDocs hits = is.search(query, 10);
            long end = System.currentTimeMillis();

            System.err.println("Found "+hits.totalHits+" document(s) (in "+ (end-start) +" milliseconds) that matched query'"+q+"':");

            for (ScoreDoc scoreDoc : hits.scoreDocs) {
                Document doc = is.doc(scoreDoc.doc);
                System.out.println(doc.get("fullpath"));
            }
        }
    }

}

用到的 jar 包：

Apache POI使用的更多相关文章

简单使用Apache POI
Apache POI是一个纯Java编写用来操作Microsoft Office的框架,最常见的应用是让服务器后台按照特定的数据生成Excel表格提供给用户实用.前段时间因为项目的需要被大量使用,使用 ...
使用maven引入Apache poi jar包
maven构建的项目-->pom.xml文件 eclipse提供Dependencies直接添加依赖jar包的工具:直接搜索poi以及poi-ooxml即可,maven会自动依赖需要的jar包: ...
apache poi导出excel报表
Apache POI 是用Java编写的免费开源的跨平台的 Java API,Apache POI提供API给Java程式对Microsoft Office格式档案读和写的功能.POI为"P ...
Apache POI 实现对 Excel 文件读写
1. Apache POI 简介 Apache POI是Apache软件基金会的开放源码函式库. 提供API给Java应用程序对Microsoft Office格式档案读和写的功能. 老外起名字总是很 ...
APACHE POI教程 --java应用程序用POI与Excel交互
POI报表 --用POI与Excel交互 AURISOFT 第一章 POI简介 --Jakata Poi HSSF:纯java的Excel解决方案在我们实际的开发中,表现层的解决方案虽然有多样,但是 ...
apache poi 生成excel
ExcelBuilder.Java package com.coracle.yk.xmanager.util.poi; import com.coracle.yk.xframework.util.Bl ...
weblogic 12c下jxls导出excel报错Could not initialize class org.apache.poi.xssf.usermodel.XSSFVMLDrawing
周一,开发反馈weblogic 12c下jxls导出excel报错,公司环境和UAT环境均报错,看日志如下: 2016-06-08 09:16:55,825 ERROR org.jxls.util.T ...
[转]How to insert a row between two rows in an existing excel with HSSF (Apache POI)
本文转自:http://stackoverflow.com/questions/5785724/how-to-insert-a-row-between-two-rows-in-an-existing- ...
如何用Apache POI操作Excel文件-----如何对一个单元格加注解？
有的时候,我们需要通过操作Apache POI,在生成Cell数据的同时,能对其生成的Cell,加上注解(comments),类似于下面的. 那么对于这种情况,我们的代码应该如何写呢? 借花献佛,我就 ...
如何用Apache POI操作Excel文件-----如何在已有的Excel文件中插入一行新的数据？
在POI的第一节入门中,我们提供了两个简单的例子,一个是如何用Apache POI新建一个工作薄,另外一个例子是,如果用Apache POI新建一个工作表.那么在这个章节里面,我将会给大家演示一下,如 ...

随机推荐

module.exports,exports,export和export default,import与require区别与联系
还在为module.exports.exports.export和export default,import和require区别与联系发愁吗,这一篇基本就够了! 一.首先搞清楚一个基本问题: modu ...
小y的质数
题目链接:https://ac.nowcoder.com/acm/contest/634/C 链接:https://ac.nowcoder.com/acm/contest/634/C来源:牛客网题目 ...
eclipse相关问题汇总
安装subclipse svn工具: 配置JavaHL:http://subclipse.tigris.org/wiki/JavaHL#head-5bf26515097c3231c1b04dfdb22 ...
android 小工具：pc 上用 curl 命令打开手机浏览器，浏览指定网址
测试 API 时或其它情况经常需要在手机浏览器中输入 url 一长串的 url 输起来真是麻烦 AirDroid 很强大也不用数据线,但有时老断开连接,不是很爽.发到手机 qq 吧还得手动粘贴所以自 ...
ngx.location.capture 只支持相对路径，不能用绝对路径
ngx.location.capture 是非阻塞的,ngx.location.capture也可以用来完成http请求,但是它只能请求到相对于当前nginx服务器的路径,不能使用之前的绝对路径进行访 ...
MySQL事务实现原理
MySQL事务隔离级别的实现原理知识储备只有InnoDB支持事务,所以这里说的事务隔离级别是指InnoDB下的事务隔离级别隔离级别读未提交:一个事务可以读取到另一个事务未提交的修改.这会带来脏 ...
Linux下查看日志最实用命令和方法
1.业务系统访问量不是很大的时候,使用这个,有bug的地方操作下,直接看最后操作的日志,就是你刚才操作的地方,好好查bug吧 tail -fn100 catalina.log 查询日志尾部 ...
错误：严重: Servlet.service() for servlet [appServlet] in context with path [] threw exception [Request processing failed; nested exception is org.mybatis.spring.MyBatisSystemException: nested exception is
严重: Servlet.service() for servlet [appServlet] in context with path [] threw exception [Request proc ...
ASP.NET MVC4 新手入门教程之一 ---1.介绍ASP.NET MVC4
你会建造您将实现一个简单的电影清单应用程序支持创建. 编辑. 搜索和清单数据库中的电影.下面是您将构建的应用程序的两个屏幕截图.它包括显示来自数据库的电影列表的网页: 应用程序还允许您添加. 编辑和 ...
设置固定ip后无法上公网
把电脑ip设置成固定ip后,发现其不能上公网,突然想到要设置DNS. 运行cmd程序,输入命令ipconfig /all查看此网络的DNS,设置固定ip 时添加此DNS地址即可.

Apache POI使用

Apache POI使用的更多相关文章

随机推荐

热门专题