Commit 38199d26 authored by R10's avatar R10

Merge branch 'release' of ssh://gitlab.gsstcloud.com:10022/poc/poc-api into release_gdghg

# Conflicts:
#	src/main/java/cn/com/poc/common/utils/FileUtils.java
#	src/test/java/cn/com/poc/utils/FileUtilsTest.java
parents 68a8b931 bd82d679
###### MySQL data configuration example #######
# Hibernate settings: SQL dialect plus the show_sql / format_sql switches (both enabled here).
hibernate.dialect=org.hibernate.dialect.MySQL5InnoDBDialect
hibernate.show_sql=true
hibernate.format_sql=true
# JDBC connection: driver class, connection URL (with its query parameters) and credentials.
# NOTE(review): the username and password are stored in plain text in this file -
# consider supplying them from the environment or a secret store; confirm with the team.
jdbc.driver=com.mysql.jdbc.Driver
jdbc.url=jdbc:mysql://192.168.21.31:3306/gsst_modellink_sit?useSSL=false&useUnicode=true&allowMultiQueries=true&serverTimezone=Asia/Shanghai&characterEncoding=UTF-8
jdbc.username=modellink_root
jdbc.password=56a6a2854424
# ds.* keys: presumably connection-pool sizing and the validation query used by the
# datasource - TODO confirm against the datasource bean that reads these properties.
ds.maxActive=20
ds.minIdle=1
ds.initialSize=1
ds.validationQuery=select 1 from dual
\ No newline at end of file
package cn.com.poc.utils; //package cn.com.poc.utils;
//
import cn.com.poc.common.utils.DocumentLoad; //import cn.com.poc.common.utils.DocumentLoad;
import cn.com.poc.common.utils.FileUtils; //import cn.com.poc.common.utils.FileUtils;
import cn.com.yict.framemax.core.spring.SingleContextInitializer; //import cn.com.yict.framemax.core.spring.SingleContextInitializer;
import org.apache.pdfbox.pdmodel.PDDocument; //import com.aspose.words.Document;
import org.apache.pdfbox.text.PDFTextStripper; //import com.aspose.words.HtmlSaveOptions;
import org.junit.Test; //import com.aspose.words.HtmlVersion;
import org.junit.runner.RunWith; //import com.aspose.words.SaveFormat;
import org.springframework.test.context.ContextConfiguration; //import org.apache.pdfbox.pdmodel.PDDocument;
import org.springframework.test.context.junit4.SpringJUnit4ClassRunner; //import org.apache.pdfbox.text.PDFTextStripper;
import org.springframework.test.context.web.WebAppConfiguration; //import org.junit.runner.RunWith;
//import org.junit.Test;
import java.io.*; //import org.springframework.test.context.ContextConfiguration;
//import org.springframework.test.context.junit4.SpringJUnit4ClassRunner;
/**
 * File-conversion tests, run with the Spring JUnit4 runner and a web application context.
 *
 * @author alex.yao
 * @date 2025/6/12
 */
@RunWith(SpringJUnit4ClassRunner.class)
@ContextConfiguration(initializers = SingleContextInitializer.class)
@WebAppConfiguration
public class FileUtilsTest {

    /**
     * Placeholder for the Word-to-PDF conversion test; the body is currently empty.
     *
     * @throws Exception declared for the eventual conversion call
     */
    @Test
    public void test_wordConvertPDF() throws Exception {
        // Intentionally empty: no conversion is exercised yet.
    }

    /**
     * Extracts the text of a PDF page by page and appends it to a target file,
     * writing a form feed after each page.
     *
     * <p>The output is the plain extracted text encoded as UTF-8; it is written to a path
     * ending in {@code .doc}, but no Word formatting is produced by this code.
     *
     * <p>NOTE(review): both paths point at a developer-local directory, and an
     * {@link IOException} is only reported on stderr, so the test does not fail when the
     * input file is missing - confirm whether that best-effort behavior is intended.
     */
    @Test
    public void test_pdf2word() {
        String pdfFile = "C:\\Users\\52747\\Documents\\dataset\\EMSD_Regulatory_Services_Handbook_LPG16.pdf";
        String wordFile = "C:\\Users\\52747\\Documents\\dataset\\EMSD_Regulatory_Services_Handbook_LPG16.doc";

        try {
            int totalPages;
            // Load the PDF document; try-with-resources closes it even when extraction
            // or writing fails part-way through.
            try (PDDocument pdfDoc = PDDocument.load(new File(pdfFile))) {
                totalPages = pdfDoc.getNumberOfPages();

                // Open the target file in append mode so existing content is kept.
                try (Writer writer = new OutputStreamWriter(
                        new FileOutputStream(wordFile, true),
                        java.nio.charset.StandardCharsets.UTF_8)) {
                    PDFTextStripper stripper = new PDFTextStripper();
                    stripper.setSortByPosition(true);
                    // PDFTextStripper page numbers are 1-based; restrict the range to a
                    // single page on every iteration.
                    for (int page = 1; page <= totalPages; page++) {
                        stripper.setStartPage(page);
                        stripper.setEndPage(page);
                        String pageText = stripper.getText(pdfDoc);

                        // Append the current page followed by a form feed as separator.
                        writer.write(pageText);
                        writer.write("\f");
                    }
                }
            }
            // Reported only after both the writer and the document closed cleanly.
            System.out.println("总计追加 " + totalPages + " 页到现有文件");
        } catch (IOException e) {
            System.err.println("转换失败:" + e.getMessage());
            e.printStackTrace();
        }
    }

}
// stripper.setEndPage(i);
// String pageText = stripper.getText(pdfDoc);
//
// // 追加当前页内容
// writer.write(pageText);
// writer.write("\f");
// }
// }
// pdfDoc.close();
// System.out.println("总计追加 " + totalPages + " 页到现有文件");
// } catch (IOException e) {
// System.err.println("转换失败:" + e.getMessage());
// e.printStackTrace();
// }
// }
//
//}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment