2018-03-21 11:34:44 Java 脚本：批量将带 BOM 的 UTF-8 Java 源码文件转换为不带 BOM 的 UTF-8 编码文件

package com.springbootdubbo;

import java.io.*;
import java.util.ArrayList;
import java.util.List;

/**
 * A {@link Reader} that detects and skips a leading Unicode byte-order mark (BOM),
 * bundled with a small command-line utility that rewrites source files as UTF-8
 * without a BOM.
 *
 * <p>Recognized marks: UTF-8 ({@code EF BB BF}), UTF-16BE ({@code FE FF}),
 * UTF-16LE ({@code FF FE}), UTF-32BE ({@code 00 00 FE FF}) and
 * UTF-32LE ({@code FF FE 00 00}). When no mark is present the caller-supplied
 * default encoding is used and no bytes are consumed.
 *
 * <p>Created 2018/11/19 18:30.
 *
 * @author zyh
 */
public class UTF8BOMConverter extends Reader {

    /** Underlying byte stream, wrapped so that non-BOM look-ahead bytes can be pushed back. */
    PushbackInputStream internalIn;

    /** Decoding reader, created lazily by {@link #init()}; {@code null} until then. */
    InputStreamReader internalIn2 = null;

    /** Encoding used when the stream has no BOM; {@code null} selects the platform default. */
    String defaultEnc;

    /** Number of look-ahead bytes: the length of the longest supported BOM (UTF-32). */
    private static final int BOM_SIZE = 4;

    /**
     * Creates a BOM-aware reader. No bytes are read until the first
     * {@link #read(char[], int, int)} or {@link #init()} call.
     *
     * @param in         input stream to be read
     * @param defaultEnc default encoding if the stream does not have a BOM marker;
     *                   give {@code null} to use the system-level default
     */
    UTF8BOMConverter(InputStream in, String defaultEnc) {
        internalIn = new PushbackInputStream(in, BOM_SIZE);
        this.defaultEnc = defaultEnc;
    }

    /**
     * Returns the encoding that is applied when no BOM is found.
     *
     * @return the default encoding given to the constructor, possibly {@code null}
     */
    public String getDefaultEncoding() {
        return defaultEnc;
    }

    /**
     * Returns the encoding of the stream, or {@code null} if the stream is uninitialized.
     * Call {@link #init()} or {@link #read(char[], int, int)} to initialize it.
     *
     * @return the name reported by the underlying {@link InputStreamReader}, or {@code null}
     */
    public String getEncoding() {
        if (internalIn2 == null) {
            return null;
        }
        return internalIn2.getEncoding();
    }

    /**
     * Reads ahead up to four bytes and checks them for a BOM. Bytes that are not part of
     * the BOM are pushed back onto the stream, so only the BOM itself is skipped.
     * Subsequent calls are no-ops.
     *
     * @throws IOException if reading the look-ahead bytes fails or the selected encoding
     *                     is not supported
     */
    protected void init() throws IOException {
        if (internalIn2 != null) {
            return;
        }

        byte[] bom = new byte[BOM_SIZE];

        // A single read() may legally return fewer bytes than requested, so keep reading
        // until the look-ahead buffer is full or the stream ends.
        int n = 0;
        while (n < bom.length) {
            int count = internalIn.read(bom, n, bom.length - n);
            if (count < 0) {
                break;
            }
            n += count;
        }

        // Every comparison is guarded by the number of bytes actually read; otherwise the
        // zero-filled tail of the buffer makes a lone "FF FE" look like a UTF-32LE mark.
        String encoding;
        int bomLength;
        if (n >= 4 && bom[0] == (byte) 0x00 && bom[1] == (byte) 0x00
                && bom[2] == (byte) 0xFE && bom[3] == (byte) 0xFF) {
            encoding = "UTF-32BE";
            bomLength = 4;
        } else if (n >= 4 && bom[0] == (byte) 0xFF && bom[1] == (byte) 0xFE
                && bom[2] == (byte) 0x00 && bom[3] == (byte) 0x00) {
            encoding = "UTF-32LE";
            bomLength = 4;
        } else if (n >= 3 && bom[0] == (byte) 0xEF && bom[1] == (byte) 0xBB
                && bom[2] == (byte) 0xBF) {
            encoding = "UTF-8";
            bomLength = 3;
        } else if (n >= 2 && bom[0] == (byte) 0xFE && bom[1] == (byte) 0xFF) {
            encoding = "UTF-16BE";
            bomLength = 2;
        } else if (n >= 2 && bom[0] == (byte) 0xFF && bom[1] == (byte) 0xFE) {
            encoding = "UTF-16LE";
            bomLength = 2;
        } else {
            // Unicode BOM not found: push back every byte that was read.
            encoding = defaultEnc;
            bomLength = 0;
        }

        int unread = n - bomLength;
        if (unread > 0) {
            internalIn.unread(bom, bomLength, unread);
        }

        // Fall back to the platform default charset when no encoding is known.
        if (encoding == null) {
            internalIn2 = new InputStreamReader(internalIn);
        } else {
            internalIn2 = new InputStreamReader(internalIn, encoding);
        }
    }

    /**
     * Closes the reader and the underlying stream. Closing never triggers BOM detection:
     * if the stream was not initialized yet, the raw stream is closed directly.
     *
     * @throws IOException if closing the underlying stream fails
     */
    @Override
    public void close() throws IOException {
        if (internalIn2 != null) {
            internalIn2.close();
        } else {
            internalIn.close();
        }
    }

    /**
     * Reads decoded characters, initializing BOM detection on first use.
     *
     * @param cbuf destination buffer
     * @param off  offset at which to start storing characters
     * @param len  maximum number of characters to read
     * @return the number of characters read, or {@code -1} at end of stream
     * @throws IOException if an I/O error occurs
     */
    @Override
    public int read(char[] cbuf, int off, int len) throws IOException {
        init();
        return internalIn2.read(cbuf, off, len);
    }

    /**
     * Reads a file (skipping any BOM) and writes its content back to the same path.
     *
     * @param filePath     path of the file to rewrite in place
     * @param readEncoding encoding assumed when the file has no BOM
     * @param saveEncoding encoding used to write the file
     * @throws Exception if reading or writing fails
     */
    private static void readContentAndSaveWithEncoding(String filePath, String readEncoding, String saveEncoding) throws Exception {
        saveContent(filePath, readContent(filePath, readEncoding), saveEncoding);
    }

    /**
     * Overwrites a file with the given text.
     *
     * @param filePath path of the file to write
     * @param content  text to write
     * @param encoding charset name used for encoding the text
     * @throws Exception if the file cannot be opened or written
     */
    private static void saveContent(String filePath, String content, String encoding) throws Exception {
        // try-with-resources closes (and thereby flushes) both streams even on failure.
        try (FileOutputStream fos = new FileOutputStream(filePath);
             OutputStreamWriter w = new OutputStreamWriter(fos, encoding)) {
            w.write(content);
            w.flush();
        }
    }

    /**
     * Reads a whole text file, skipping a leading BOM if present.
     *
     * <p>Note: the file is read line by line and every line is terminated with
     * {@code "\r\n"}, so line endings are normalized to CRLF and a final line break is
     * always present in the result.
     *
     * @param filePath path of the file to read
     * @param encoding encoding assumed when the file has no BOM
     * @return the file content with CRLF line endings
     * @throws Exception if the file cannot be opened or read
     */
    private static String readContent(String filePath, String encoding) throws Exception {
        // StringBuilder avoids the quadratic cost of repeated String concatenation.
        StringBuilder fileContent = new StringBuilder();
        try (BufferedReader br = new BufferedReader(
                new UTF8BOMConverter(new FileInputStream(new File(filePath)), encoding))) {
            String line;
            while ((line = br.readLine()) != null) {
                fileContent.append(line).append("\r\n");
            }
        }
        return fileContent.toString();
    }

    /**
     * Reads a UTF-8 text file and returns its lines in order.
     *
     * @param filePath path of the file to read
     * @return one list entry per line, without line terminators
     * @throws Exception if the file cannot be opened or read
     */
    private static List<String> getPerlineFileName(String filePath) throws Exception {
        List<String> list = new ArrayList<String>();
        try (BufferedReader br = new BufferedReader(
                new InputStreamReader(new FileInputStream(new File(filePath)), "UTF-8"))) {
            String line;
            while ((line = br.readLine()) != null) {
                list.add(line);
            }
        }
        return list;
    }

    /**
     * Recursively collects the paths of all entries below a directory. Sub-directories
     * themselves are included in the result as well as the files they contain.
     *
     * @param filePath  directory to scan
     * @param filePaths list that receives the paths; also returned for convenience
     * @return {@code filePaths}, unchanged when {@code filePath} cannot be listed
     */
    private static List<String> getAllFilePaths(File filePath, List<String> filePaths) {
        File[] files = filePath.listFiles();
        if (files == null) {
            // Not a directory, or an I/O error occurred while listing it.
            return filePaths;
        }
        for (File f : files) {
            filePaths.add(f.getPath());
            if (f.isDirectory()) {
                getAllFilePaths(f, filePaths);
            }
        }
        return filePaths;
    }

    /**
     * Rewrites every matching file below a root directory as UTF-8 without a BOM.
     *
     * @param args optional arguments: {@code args[0]} is the root directory
     *             (default {@code E:\mgtt\DING}), {@code args[1]} is the file-name suffix
     *             to match (default {@code .java})
     * @throws Exception if any file cannot be read or written
     */
    public static void main(String[] args) throws Exception {
        String root = args.length > 0 ? args[0] : "E:\\mgtt\\DING";
        String suffix = args.length > 1 ? args[1] : ".java";

        List<String> paths = getAllFilePaths(new File(root), new ArrayList<String>());

        for (String path : paths) {
            // The listing also contains directories; skip them even if the name matches.
            if (!path.endsWith(suffix) || !new File(path).isFile()) {
                continue;
            }
            readContentAndSaveWithEncoding(path, "UTF-8", "UTF-8");
            System.out.println(path + "转换成功");
        }
    }

}

2018-03-21 11:34:44 java脚本批量转换java utf-8 bom源码文件为utf-8编码文件的更多相关文章

GCN代码分析 2019.03.12 22:34:54字数 560阅读 5714 本文主要对GCN源码进行分析。
GCN代码分析 1 代码结构 . ├── data // 图数据 ├── inits // 初始化的一些公用函数 ├── layers // GCN层的定义 ├── metrics // 评测指标 ...
图书管理系统（Java实现，十个数据表，含源码、ER图，超详细报告解释，2020.7.11更新）
图书管理系统数据库设计实验报告文章目录更新日志 1.概述 2.需求分析 2.1需要实现的功能 2.2业务流程图 2.2.1学生流程图 2.2.2管理员流程图 2.2.3超级管理员流程图 2.3功能 ...
java学习笔记（3）数据类型、源码、反码、补码、精度损失、基本数据类型互相转换
关于java中的数据类型: 1.数据类型的作用是什么? 程序当中有很多数据,每一个数据都是有相关类型的,不同数据类型的数据占用的空间大小不同. 数据类型的作用是指导java虚拟机(JVM)在运行程序的 ...
Java 集合系列10之 HashMap详细介绍(源码解析)和使用示例
概要这一章,我们对HashMap进行学习.我们先对HashMap有个整体认识,然后再学习它的源码,最后再通过实例来学会使用HashMap.内容包括:第1部分 HashMap介绍第2部分 HashMa ...
java io系列02之 ByteArrayInputStream的简介,源码分析和示例(包括InputStream)
我们以ByteArrayInputStream,拉开对字节类型的“输入流”的学习序幕.本章,我们会先对ByteArrayInputStream进行介绍,然后深入了解一下它的源码,最后通过示例来掌握它的 ...
Java 集合系列07之 Stack详细介绍(源码解析)和使用示例
概要学完Vector了之后,接下来我们开始学习Stack.Stack很简单,它继承于Vector.学习方式还是和之前一样,先对Stack有个整体认识,然后再学习它的源码:最后再通过实例来学会使用它. ...
java基础解析系列(十)---ArrayList和LinkedList源码及使用分析
java基础解析系列(十)---ArrayList和LinkedList源码及使用分析目录 java基础解析系列(一)---String.StringBuffer.StringBuilder jav ...
[Spark内核] 第34课：Stage划分和Task最佳位置算法源码彻底解密
本課主題 Job Stage 划分算法解密 Task 最佳位置算法實現解密引言作业调度的划分算法以及 Task 的最佳位置的算法,因为 Stage 的划分是DAGScheduler 工作的核心,这 ...
【转】 Java 集合系列07之 Stack详细介绍(源码解析)和使用示例
概要学完Vector了之后,接下来我们开始学习Stack.Stack很简单,它继承于Vector.学习方式还是和之前一样,先对Stack有个整体认识,然后再学习它的源码:最后再通过实例来学会使用它. ...

随机推荐

跨页面传值之Cookie
3.客户端再次访问某站点浏览器将携带Cookie信息的指令,将获得的信息参与编译. 4.将含有Cookie信息参与编译的页面发回给浏览器其中如果有相关的设置Cookie的指令.将再次通过浏览器,写 ...
Checkbox与foreach循环
呈现形态&控件语法 <span style=”display:inline-block;”> <input id=”checkBox2” type=”checkBox” na ...
Sql批处理语句
同时写3个批处理,如果前2个批处理没有问题,最后一个有错误那么3个批处理都不会执行需要注意列如: use Materl GO select * from t_icitem GO inset into ...
ArrayList 集合
ArrayList 集合:很多数据的一个集合数组:长度不可变.类型单一集合的好处:长度可以任意改变类型随便集合长度都的问题很多数据的集合数组类型不可变长度单一 ...
MarkDown 语言简单使用
# Markdown file ![alt img is error](http://cdn2.jianshu.io/assets/web/logo-58fd04f6f0de908401aa561cd ...
glyphicons-halflings-regular.woff2 文件 404
搜索了下,果然是因为MIME类型没有配置的原因. http://stackoverflow.com/questions/32300578/how-to-remove-error-about-glyphic ...
Cocos2d-js 开发记录：图片数据资源等的异步加载
这里说的是在需要的时候加载图片,比如游戏中的某个关卡的图片,不用在游戏一开始就加载(万一用户玩不到那关,岂不是很冤,流量费了那么多),否则载入速度也慢.这种方式加载资源要用到cc.loader官方文档 ...
Bootstrap导航栏navbar源码分析
1.本文目地:分析bootstrap导航栏及其响应式的实现方式,提升自身css水平先贴一个bootstrap的导航栏模板 http://v3.bootcss.com/examples/navbar- ...
ie 9 渐变背景色兼容问题
/*窗口背景*/ .window { background-color: #fff; background: -webkit-linear-gradient(top,#EFF5FF 0, ...
arcgis server 10.1 发布动态图层展示海量及频繁更新的数据步骤
Arcgis server 发布动态图层及调用动态图层做这个动态图层功能的原由是有一个30万的数据需要通过arcgis GP工具转成shp然后渲染加载进地图,原来的做法是遍历生成shp面要素,读 ...

2018-03-21 11:34:44 java脚本批量转换java utf-8 bom源码文件为utf-8编码文件

2018-03-21 11:34:44 java脚本批量转换java utf-8 bom源码文件为utf-8编码文件的更多相关文章

随机推荐

热门专题