Java 用于使用apache POI转换为CSV时的xlsx单元格数据

Java 用于使用apache POI转换为CSV时的xlsx单元格数据,java,csv,apache-poi,supercsv,Java,Csv,Apache Poi,Supercsv,我正在使用下面的程序将xlsx转换为csv,如果每个单元格字符串包含换行符(/n)或分隔符,我想在其中添加引号字符(“”) import java.io.File; import java.io.FileInputStream; import java.io.FileOutputStream; import java.util.Iterator; import org.apache.poi.ss.usermodel.Cell; import org.apache.poi.ss.usermode

我正在使用下面的程序将xlsx转换为csv,如果每个单元格字符串包含换行符(/n)或分隔符,我想在其中添加引号字符(“”)

import java.io.File;
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.util.Iterator;

import org.apache.poi.ss.usermodel.Cell;
import org.apache.poi.ss.usermodel.Row;
import org.apache.poi.xssf.usermodel.XSSFSheet;
import org.apache.poi.xssf.usermodel.XSSFWorkbook;

public class XlsxtoCSV {

    static void xlsx(File inputFile, File outputFile) {
        // For storing data into CSV files
        StringBuffer data = new StringBuffer();

        try {
            FileOutputStream fos = new FileOutputStream(outputFile);
            // Get the workbook object for XLSX file
            XSSFWorkbook wBook = new XSSFWorkbook(new FileInputStream(inputFile));
            // Get first sheet from the workbook
            XSSFSheet sheet = wBook.getSheetAt(0);
            Row row;
            Cell cell;
            // Iterate through each rows from first sheet
            Iterator<Row> rowIterator = sheet.iterator();

            while (rowIterator.hasNext()) {
                row = rowIterator.next();

                // For each row, iterate through each columns
                Iterator<Cell> cellIterator = row.cellIterator();
                while (cellIterator.hasNext()) {

                    cell = cellIterator.next();

                    switch (cell.getCellType()) {
                        case Cell.CELL_TYPE_BOOLEAN:
                            data.append(cell.getBooleanCellValue() + ",");

                            break;
                        case Cell.CELL_TYPE_NUMERIC:
                            data.append(cell.getNumericCellValue() + ",");

                            break;
                        case Cell.CELL_TYPE_STRING:
                            data.append(cell.getStringCellValue() + ",");
                            break;

                        case Cell.CELL_TYPE_BLANK:
                            data.append("" + ",");
                            break;
                        default:
                            data.append(cell + ",");

                    }
                }
            }

            fos.write(data.toString().getBytes());
            fos.close();

        } catch (Exception ioe) {
            ioe.printStackTrace();
        }
    }
    //testing the application 

    public static void main(String[] args) {
        //reading file from desktop
        File inputFile = new File("C:\\Users\\user69\\Desktop\\test.xlsx");
        //writing excel data to csv 
        File outputFile = new File("C:\\Users\\user69\\Desktop\\test1.csv");
        xlsx(inputFile, outputFile);
    }
}
导入java.io.File;
导入java.io.FileInputStream;
导入java.io.FileOutputStream;
导入java.util.Iterator;
导入org.apache.poi.ss.usermodel.Cell;
导入org.apache.poi.ss.usermodel.Row;
导入org.apache.poi.xssf.usermodel.xssfheet;
导入org.apache.poi.xssf.usermodel.xssf工作簿;
公共类XlsxtoCSV{
静态void xlsx(文件输入文件、文件输出文件){
//用于将数据存储到CSV文件中
StringBuffer数据=新的StringBuffer();
试一试{
FileOutputStream fos=新的FileOutputStream(outputFile);
//获取XLSX文件的工作簿对象
XSSF工作簿wBook=新XSSF工作簿(新文件InputStream(inputFile));
//从工作簿中获取第一张工作表
XSSFSheet sheet=wBook.getSheetAt(0);
行行;
细胞;
//从第一张图纸开始遍历每行
迭代器rowIterator=sheet.Iterator();
while(roweiterator.hasNext()){
行=行迭代器。下一步();
//对于每一行,遍历每一列
迭代器cellIterator=row.cellIterator();
while(cellIterator.hasNext()){
cell=cellIterator.next();
开关(cell.getCellType()){
case Cell.Cell\u类型\u布尔值:
data.append(cell.getBooleanCellValue()+“,”);
打破
case Cell.Cell\u类型\u数值:
data.append(cell.getNumericCellValue()+“,”);
打破
case Cell.Cell\u类型\u字符串:
data.append(cell.getStringCellValue()+“,”);
打破
case Cell.Cell\u类型\u空白:
数据。追加(“+”,”);
打破
违约:
数据。追加(单元格+“,”);
}
}
}
fos.write(data.toString().getBytes());
fos.close();
}捕获(异常ioe){
ioe.printStackTrace();
}
}
//测试应用程序
公共静态void main(字符串[]args){
//从桌面读取文件
File inputFile=新文件(“C:\\Users\\user69\\Desktop\\test.xlsx”);
//将excel数据写入csv
File outputFile=新文件(“C:\\Users\\user69\\Desktop\\test1.csv”);
xlsx(输入文件,输出文件);
}
}
根据RFC4180 Csv规则。包含换行符(CRLF)、双引号和逗号的字段应该用双引号括起来。因此,如果单元格数据包含换行符或分隔符(,),在添加到字符串缓冲区之前,我必须格式化单元格数据(数字、字符串或任何其他类型)。请帮助我根据CSV规则格式化单元格数据。

使用类似以下库:

另请参见短文

的回答完全正确。为了扩展他所写的内容,下面是我完整且经过测试的方法,它使用Commons CSV进行实际值打印。不幸的是,我们仍然需要在工作表上迭代,XSSF中没有自动的CSV输出方法,但我遵循了Centic的策略来进行行/单元格迭代

本例输出到
输出流
,但显然
文件
同样容易(在
CSVPrinter
构造函数中使用
FileReader

//将XSSF工作簿转换为CSV并写入提供的OutputStream
私有无效writeWorkbookAsCSVToOutputStream(XSSFWorkbook工作簿,OutputStream out){
CSVPrinter CSVPrinter=null;
试一试{
//或者,如果需要文件输出,则将其更改为基于文件的构造函数
csvPrinter=新的csvPrinter(新的OutputStreamWriter(输出),CSVFormat.DEFAULT);
如果(工作簿!=null){
XSSFSheet sheet=workbook.getSheetAt(0);//sheet#0
迭代器rowIterator=sheet.rowIterator();
while(roweiterator.hasNext()){
行=行迭代器。下一步();
迭代器cellIterator=row.cellIterator();
while(cellIterator.hasNext()){
Cell=cellIterator.next();
csvPrinter.print(cell.getStringCellValue());//此处打印Commons CSV
}
//每行后换行
csvPrinter.println();
}
}
}
捕获(例外e){
log.error(“未能将CSV文件写入输出流”,e);
}
最后{
试一试{
如果(csvPrinter!=null){
//闭合式CSV打印机
csvPrinter.flush();
csvPrinter.close();
}
}
捕获(ioe异常ioe){
日志错误(“关闭CSV打印机时出错”,ioe);
}           
}
}   

为什么不使用众多优秀的开源CSV编写库中的一个,让它为您完成工作?>
final Appendable out = ...;  
final CSVPrinter printer = CSVFormat.DEFAULT.withHeader("H1", "H2").print(out);
...
while (rowIterator.hasNext()) {
    ...
    while (cellIterator.hasNext()) {
        ...
        printer.print(cell.getStringCellValue());
        ...
    }
    printer.println();
}
// Convert an XSSFWorkbook to CSV and write to provided OutputStream
private void writeWorkbookAsCSVToOutputStream(XSSFWorkbook workbook, OutputStream out) {

    CSVPrinter csvPrinter = null;

    try {
        // Or change this to  File-based constructor, if File output is required
        csvPrinter = new CSVPrinter(new OutputStreamWriter(out), CSVFormat.DEFAULT);                

        if (workbook != null) {
            XSSFSheet sheet = workbook.getSheetAt(0); // Sheet #0
            Iterator<Row> rowIterator = sheet.rowIterator();
            while (rowIterator.hasNext()) {               
                Row row = rowIterator.next();
                Iterator<Cell> cellIterator = row.cellIterator();
                while (cellIterator.hasNext()) {
                    Cell cell = cellIterator.next();
                    csvPrinter.print(cell.getStringCellValue()); // Commons CSV prints here
                }
                // Newline after each row
                csvPrinter.println();
            }

        }

    }
    catch (Exception e) {
        log.error("Failed to write CSV file to output stream", e);
    }
    finally {
        try {
            if (csvPrinter != null) {
                // Close CSVPrinter
                csvPrinter.flush();
                csvPrinter.close();
            }
        }
        catch (IOException ioe) {
            log.error("Error when closing CSV Printer", ioe);
        }           
    }
}