java csv 切换单元格_使用java将PDF转换为CSV

强化
2023-12-01

请参阅以下使用 Java 将 PDF 转换为 CSV 的示例:

https://github.com/pdftables/java-pdftables-api

每个页面都是独立处理的,因此 PDF 的动态特性不应该成为问题。你可以在他们的网站上使用免费试用版。

package com.pdftables.examples;

import java.io.File;
import java.net.URLEncoder;
import java.util.Arrays;
import java.util.List;
import java.util.Locale;

import org.apache.commons.io.FileUtils;
import org.apache.http.HttpEntity;
import org.apache.http.client.config.CookieSpecs;
import org.apache.http.client.config.RequestConfig;
import org.apache.http.client.methods.CloseableHttpResponse;
import org.apache.http.client.methods.HttpPost;
import org.apache.http.entity.mime.MultipartEntityBuilder;
import org.apache.http.entity.mime.content.FileBody;
import org.apache.http.impl.client.CloseableHttpClient;
import org.apache.http.impl.client.HttpClients;

/**
 * Command-line example that uploads a PDF to the PDFTables HTTP API and writes the converted
 * document to a file next to the input.
 *
 * <p>Usage: {@code ConvertToFile <API_KEY> <FORMAT> <PDF filename>}, where {@code FORMAT} is one
 * of {@code csv}, {@code xml}, {@code xlsx-single} or {@code xlsx-multiple} (case-insensitive).
 *
 * <p>The process exits with status 1 on a usage error, an unknown format, an unreadable input
 * file, a non-200 HTTP response, or a response without a body.
 */
public class ConvertToFile {

    /** Output formats accepted as the second command-line argument. */
    private static final List<String> FORMATS =
            Arrays.asList("csv", "xml", "xlsx-single", "xlsx-multiple");

    /**
     * Validates the arguments, posts the PDF as a multipart upload and saves the response body.
     *
     * @param args {@code [apiKey, format, pdfFilename]}
     * @throws Exception if the HTTP exchange or writing the output file fails
     */
    public static void main(String[] args) throws Exception {
        if (args.length != 3) {
            System.out.println("Command line: <API_KEY> <FORMAT> <PDF filename>");
            System.exit(1);
        }

        final String apiKey = args[0];
        // Locale.ROOT keeps the comparison stable under locales with special casing rules
        // (e.g. Turkish, where "I" lowercases to a dotless "ı" and "XLSX-SINGLE" would not match).
        final String format = args[1].toLowerCase(Locale.ROOT);
        final String pdfFilename = args[2];

        if (!FORMATS.contains(format)) {
            System.out.println("Invalid output format: \"" + format + "\"");
            System.exit(1);
        }

        // Avoid cookie warning with default cookie configuration
        RequestConfig globalConfig =
                RequestConfig.custom().setCookieSpec(CookieSpecs.STANDARD).build();

        File inputFile = new File(pdfFilename);
        if (!inputFile.canRead()) {
            System.out.println("Can't read input PDF file: \"" + pdfFilename + "\"");
            System.exit(1);
        }

        try (CloseableHttpClient httpclient =
                HttpClients.custom().setDefaultRequestConfig(globalConfig).build()) {
            // The format is already restricted to the known list above; the key comes straight
            // from the command line, so encode it before placing it in the query string.
            HttpPost httppost = new HttpPost(
                    "https://pdftables.com/api?format=" + format
                            + "&key=" + URLEncoder.encode(apiKey, "UTF-8"));

            // The PDF is sent as the multipart form field named "f".
            FileBody fileBody = new FileBody(inputFile);
            HttpEntity requestBody = MultipartEntityBuilder.create().addPart("f", fileBody).build();
            httppost.setEntity(requestBody);

            System.out.println("Sending request");

            try (CloseableHttpResponse response = httpclient.execute(httppost)) {
                if (response.getStatusLine().getStatusCode() != 200) {
                    System.out.println(response.getStatusLine());
                    System.exit(1);
                }

                HttpEntity resEntity = response.getEntity();
                if (resEntity != null) {
                    // Drop the "-single" / "-multiple" qualifier so xlsx variants get ".xlsx".
                    final String outputFilename =
                            getOutputFilename(pdfFilename, format.replaceFirst("-.*$", ""));
                    System.out.println("Writing output to " + outputFilename);

                    final File outputFile = new File(outputFilename);
                    FileUtils.copyToFile(resEntity.getContent(), outputFile);
                } else {
                    System.out.println("Error: file missing from response");
                    System.exit(1);
                }
            }
        }
    }

    /**
     * Derives the output file name from the input PDF name.
     *
     * <p>A trailing {@code .pdf} (any letter case) is replaced by {@code .suffix}, provided at
     * least one character precedes it; otherwise {@code .suffix} is appended to the full name.
     *
     * @param pdfFilename path of the input file as given on the command line
     * @param suffix      extension for the output file, without the leading dot
     * @return the output file name
     */
    private static String getOutputFilename(String pdfFilename, String suffix) {
        if (pdfFilename.length() >= 5 && pdfFilename.toLowerCase(Locale.ROOT).endsWith(".pdf")) {
            return pdfFilename.substring(0, pdfFilename.length() - 4) + "." + suffix;
        } else {
            return pdfFilename + "." + suffix;
        }
    }
}

 类似资料: