index.js 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527
  1. const fs = require('fs')
  2. const path = require('path')
  3. const compressing = require('compressing')
  4. const rimrif = require('rimraf')
  5. const shell = require('shelljs');
  6. const crypto = require('crypto');
  7. // 文档模板生成
  8. const PizZip = require("pizzip");
  9. const Docxtemplater = require("docxtemplater");
  10. // 文档转换
  11. import { Chromiumly } from "chromiumly";
  12. // Chromiumly.configure({ endpoint: "http://8.140.98.43/docs" });
  13. Chromiumly.configure({ endpoint: "http://123.57.204.89/docs" });
  14. import { PDFEngines } from "chromiumly";
  15. const { LibreOffice } = require("chromiumly");
  16. // const { PDFEngines } = require("chromiumly");
  // Default scratch directory for downloaded, rendered and zipped files.
  // Functions in this module use `options.tempDir` instead when the caller provides one.
  const tempDir = path.join(__dirname, "temp");
  // `recursive: true` makes the call a no-op when the directory already exists,
  // which removes the exists-then-create race of the previous check.
  fs.mkdirSync(tempDir, { recursive: true });
  19. const OSS = require("ali-oss");
  // Alibaba Cloud OSS settings. Values come from the environment first.
  //
  // SECURITY: the literal fallbacks below are credentials committed to source control.
  // They are kept only so existing deployments that rely on them keep working.
  // TODO(security): rotate this key pair, remove the literals, and fail fast when
  // ALI_OSS_ACCESS_KEY_ID / ALI_OSS_ACCESS_KEY_SECRET are not set.
  const ALI_OSS_BUCKET = process.env.ALI_OSS_BUCKET || "hep-textbook";
  const ALI_OSS_ACCESS_KEY_ID = process.env.ALI_OSS_ACCESS_KEY_ID || "LTAI5t6AbTiAvXmeoVdJZhL3";
  const ALI_OSS_ACCESS_KEY_SECRET = process.env.ALI_OSS_ACCESS_KEY_SECRET || "KLtQRdIW69KLP7jnzHNUf7eKmdptxH";
  if (!process.env.ALI_OSS_ACCESS_KEY_ID || !process.env.ALI_OSS_ACCESS_KEY_SECRET) {
    // Make the use of embedded credentials visible in the logs instead of silent.
    console.warn("[oss] ALI_OSS_ACCESS_KEY_ID / ALI_OSS_ACCESS_KEY_SECRET not set; using credentials embedded in source");
  }
  23. const bwipjs = require("bwip-js")
  /**
   * Render `text` as a Code 128 barcode image using bwip-js.
   *
   * Best-effort: any failure is logged and reported as `null`; the returned
   * promise never rejects.
   *
   * @param {string} text - Content to encode in the barcode.
   * @returns {Promise<*|null>} The image data handed to the bwip-js callback, or `null` on failure.
   */
  export async function toBarCode(text) {
    return new Promise((resolve) => {
      const fail = (err) => {
        console.error(err);
        resolve(null);
      };
      try {
        bwipjs.toBuffer(
          {
            bcid: "code128",
            text: text,
            scale: 1.5,
            height: 3,
            includetext: false,
            textalign: "center",
          },
          (err, png) => (err ? fail(err) : resolve(png))
        );
      } catch (err) {
        // A synchronous throw inside the executor would reject the promise and
        // bypass the "log and return null" contract used for callback errors.
        fail(err);
      }
    });
  }
  /**
   * Upload a local file to the configured OSS bucket under `export/report/<file name>`.
   *
   * A new OSS client is created on every call. Errors from the client are not
   * caught here and propagate to the caller.
   *
   * @param {string} filePath - Local path of the file to upload.
   * @returns {Promise<*>} The result returned by the OSS client's `put` call.
   */
  export async function uploadFileToOSS(filePath) {
    const client = new OSS({
      // Region the bucket lives in.
      region: "oss-cn-beijing",
      accessKeyId: ALI_OSS_ACCESS_KEY_ID,
      accessKeySecret: ALI_OSS_ACCESS_KEY_SECRET,
      // Bucket name.
      bucket: ALI_OSS_BUCKET || "hep-textbook",
    });
    const fileKey = `export/report/${getFileName(filePath)}`;
    const result = await client.put(fileKey, filePath);
    console.log('put success: %j', result);
    return result;
  }
  /**
   * Return the last segment of a path, treating both `/` and `\` as separators.
   *
   * Trailing separators are ignored, so `"a/b/"` yields `"b"` (matching the
   * behaviour of `path.basename`), and null/undefined input yields `""`
   * instead of throwing.
   *
   * @param {string} filePath - Path using `/` and/or `\` separators.
   * @returns {string} The final path segment, or `""` when there is none.
   */
  export function getFileName(filePath) {
    if (filePath == null) {
      return "";
    }
    // Splitting on runs of separators and dropping empty pieces handles
    // trailing and doubled separators in one pass.
    const segments = String(filePath).split(/[/\\]+/).filter(Boolean);
    return segments.length > 0 ? segments[segments.length - 1] : "";
  }
  65. module.exports.uploadFileToOSS = uploadFileToOSS
  /**
   * Pack the given files into a zip archive inside the temp directory.
   *
   * Paths that do not exist are logged and skipped. The returned promise always
   * settles: it resolves to the archive path on success and to `null` on any
   * failure (setup error, zip stream error, or write error).
   *
   * @param {Array<string>} filePathList - Paths of the files to add to the archive.
   * @param {string} outputZipName - File name of the archive to create.
   * @param {{tempDir?: string}} [options] - `tempDir` overrides the module's default temp directory.
   * @returns {Promise<string|null>} Path of the written archive, or `null` on failure.
   */
  export function createZip(filePathList, outputZipName, options) {
    return new Promise((resolve) => {
      try {
        const outputPath = path.join(options?.tempDir || tempDir, outputZipName);
        const zipStream = new compressing.zip.Stream();

        for (const filePath of filePathList) {
          if (fs.existsSync(filePath)) {
            zipStream.addEntry(filePath);
          } else {
            console.error(`文件不存在: ${filePath}`);
          }
        }

        const output = fs.createWriteStream(outputPath);
        output.on('finish', () => {
          resolve(outputPath);
        });
        output.on('error', (error) => {
          console.error('写入压缩包时出错:', error);
          resolve(null);
        });
        // pipe() does not forward source errors to the destination, so without
        // this handler a failing zip stream would leave the promise pending.
        zipStream.on('error', (error) => {
          console.error('创建压缩包时出错:', error);
          output.destroy();
          resolve(null);
        });
        zipStream.pipe(output);
      } catch (error) {
        console.error('创建压缩包时出错:', error);
        // Must resolve here: a bare `return` inside the executor would leave
        // the promise pending forever.
        resolve(null);
      }
    });
  }
  109. module.exports.createZip = createZip
  110. const download = require('download')
  /**
   * Download `url` into the temp directory and return the local file path.
   *
   * - A value starting with `/` is treated as an existing local path and returned unchanged.
   * - The local file name is the MD5 of the full URL plus the lower-cased
   *   extension of the URL's path, so the same URL maps to the same file and
   *   an existing file is reused without downloading again.
   * - Failures are logged and reported as `null`; the promise never rejects.
   *
   * @param {string} url - Remote URL, or an absolute local path.
   * @param {{tempDir?: string}} [options] - `tempDir` overrides the module's default temp directory.
   * @returns {Promise<string|null>} Local file path, or `null` when the url is unusable or the download fails.
   */
  async function downloadUrl(url, options) {
    if (typeof url !== "string" || url === "") {
      return null;
    }
    if (url.startsWith("/")) {
      return url;
    }

    // Take the extension from the URL path only, so a query string or fragment
    // ("a.pdf?token=1") does not end up inside the local file name.
    let pathname = url;
    try {
      pathname = new URL(url).pathname;
    } catch {
      // Not an absolute URL: fall back to the raw string, as before.
    }
    const extname = path.extname(pathname).toLocaleLowerCase();
    const filename = crypto.createHash('md5').update(url).digest('hex') + extname;

    try {
      const filepath = path.join(options?.tempDir || tempDir, filename);
      if (fs.existsSync(filepath)) {
        return filepath; // Same URL hash already downloaded: reuse it.
      }
      fs.writeFileSync(filepath, await download(url));
      return filepath;
    } catch (err) {
      console.error(err);
      return null;
    }
  }
  /**
   * Convert a DOCX file to PDF and optionally append further documents to it.
   *
   * Steps:
   * 1. Every entry of `options.mergeFiles` is fetched with `downloadUrl`; entries
   *    that fail are skipped and the remaining ones keep the caller's order.
   * 2. Each fetched file is copied next to itself as `<110 + index>_<md5>.<ext>`
   *    so the name carries its position.
   * 3. When `docxPath` is given it is converted on its own and written next to
   *    the DOCX as `109_<md5>.pdf`.
   * 4. With more than four inputs the PDFs are combined by `mergePdfListReduce`;
   *    otherwise all inputs are sent to LibreOffice in a single request.
   *
   * @param {string|null} docxPath - Path of the DOCX to convert; may be falsy to only merge attachments.
   * @param {string} outputPath - Path the resulting PDF is written to.
   * @param {{mergeFiles?: string[], tempDir?: string}} [options] - `mergeFiles` lists URLs or
   *   local paths to append; the whole object is also passed on to `downloadUrl`.
   * @returns {Promise<string|null>} `outputPath` on success, `null` when there is nothing to convert or a step fails.
   */
  export async function docxToPdf(docxPath, outputPath, options) {
    // Above this many inputs the merge goes through mergePdfListReduce instead
    // of one LibreOffice request.
    const REDUCE_MERGE_THRESHOLD = 4;
    const mergeFiles = options?.mergeFiles || [];
    const merge = mergeFiles.length > 0;

    try {
      // Fetch all attachments in parallel; Promise.all keeps the caller's order.
      const downloaded = await Promise.all(
        mergeFiles.map(async (url) => {
          try {
            return await downloadUrl(url, options);
          } catch (err) {
            console.error(err);
            return null;
          }
        })
      );

      // Copy each attachment to a name prefixed with its position. Numbering
      // starts at 110 so every prefix has three digits and sorts consistently.
      const filePathList = downloaded.filter(Boolean).map((filepath, index) => {
        const outmd5 = crypto.createHash('md5').update(path.basename(filepath)).digest('hex');
        const fileName = (index + 110) + "_" + outmd5 + path.extname(filepath);
        const orderPath = path.join(path.dirname(filepath), fileName);
        fs.cpSync(filepath, orderPath);
        return orderPath;
      });

      const files = [];
      if (docxPath) {
        files.push({ data: fs.readFileSync(docxPath), ext: "docx" });
      }
      files.push(...filePathList);
      if (files.length === 0) {
        console.error('转换失败:', 'no input documents');
        return null;
      }

      // Shared conversion settings. Each request gets its own `files` list so
      // one request can never overwrite the inputs of another.
      const baseOpts = {
        properties: {
          pageSize: 'A4',
          margin: { top: 0, right: 0, bottom: 0, left: 0 },
        },
        pdfa: false,
        pdfUA: false,
        merge, // true whenever attachments were requested
      };

      let mainPdfPath = null;
      let mainPdfBuffer = null;
      if (docxPath) {
        mainPdfBuffer = await LibreOffice.convert({ ...baseOpts, files: [files[0]] });
        const outmd5 = crypto.createHash('md5').update(path.basename(docxPath)).digest('hex');
        // "109_" sorts before the attachment copies, which start at "110_".
        mainPdfPath = path.dirname(docxPath) + "/109_" + outmd5 + ".pdf";
        fs.writeFileSync(mainPdfPath, mainPdfBuffer);
      }

      if (files.length > REDUCE_MERGE_THRESHOLD) {
        // Main PDF first (when there is one), then every attachment in order.
        const pdfList = [mainPdfPath, ...filePathList].filter(Boolean);
        const mergedFileList = await mergePdfListReduce(pdfList, { ...baseOpts });
        const pdfPath = mergedFileList[0];
        if (pdfPath) {
          fs.cpSync(pdfPath, outputPath);
        }
      } else {
        // A lone DOCX was already converted above; otherwise convert all inputs together.
        const pdfBuffer =
          mainPdfBuffer && filePathList.length === 0
            ? mainPdfBuffer
            : await LibreOffice.convert({ ...baseOpts, files });
        if (pdfBuffer) {
          fs.writeFileSync(outputPath, pdfBuffer);
          console.log(`成功输出 ${outputPath}`);
        }
      }
      return outputPath;
    } catch (error) {
      console.error('转换失败:', error);
      return null;
    }
  }
  255. module.exports.docxToPdf = docxToPdf
  256. const ImageModule = require("@slosarek/docxtemplater-image-module-free");
  257. const sizeOf = require("image-size");
  /**
   * Merge a list of documents into a single PDF, in batches.
   *
   * String entries that do not end in `.pdf` are first converted with
   * LibreOffice and written next to the source as `<file>.pdf`. The list is
   * then merged with `pdfUnite` in batches of up to 20 files; each batch is
   * written to `<first file of the batch>.merge.pdf`. The batch results are
   * merged again, recursively, until one file is left.
   *
   * The caller's `pdfList` and `convertOpts` are not modified. Errors from the
   * conversion or from `pdfUnite` reject the returned promise.
   *
   * @param {Array<string>} pdfList - Paths of the files to merge, in order. Falsy entries are ignored.
   * @param {object} convertOpts - Options passed to `LibreOffice.convert` for non-PDF entries (`files` is set per call).
   * @returns {Promise<Array<string>>} An array with the single merged path, or an empty array for empty input.
   */
  export async function mergePdfListReduce(pdfList, convertOpts) {
    const BATCH_SIZE = 20;
    // Match on the extension (optionally followed by a query string) rather
    // than on "pdf" appearing anywhere in the path.
    const isPdf = (file) => /\.pdf(\?.*)?$/i.test(file);

    console.log("pdfList", pdfList);

    // Convert every non-PDF entry to PDF first.
    const sources = [];
    for (const file of pdfList) {
      if (!file) {
        continue;
      }
      if (typeof file === "string" && !isPdf(file)) {
        const pdfBuffer = await LibreOffice.convert({ ...convertOpts, files: [file] });
        const convertedPath = file + ".pdf";
        fs.writeFileSync(convertedPath, pdfBuffer);
        sources.push(convertedPath);
      } else {
        sources.push(file);
      }
    }

    if (sources.length <= 1) {
      return sources;
    }

    const merged = [];
    for (let start = 0; start < sources.length; start += BATCH_SIZE) {
      const batch = sources.slice(start, start + BATCH_SIZE);
      if (batch.length === 1) {
        // A single leftover file needs no merge; carry it to the next round.
        merged.push(batch[0]);
        continue;
      }
      const mergeFilePath = batch[0] + ".merge.pdf";
      pdfUnite(batch, mergeFilePath);
      merged.push(mergeFilePath);
    }

    // Each round shrinks the list by up to a factor of BATCH_SIZE, so this terminates.
    return merged.length <= 1 ? merged : mergePdfListReduce(merged, convertOpts);
  }
  /**
   * Merge PDF files with the `pdfunite` command-line tool.
   *
   * Every path is single-quoted before it is placed on the command line, so
   * paths containing spaces or shell metacharacters are passed through
   * literally. NOTE(review): the quoting is POSIX-shell style; this assumes the
   * command runs under a POSIX shell - confirm for the deployment target.
   *
   * @param {Array<string>} pdfList - Input PDF paths, in merge order.
   * @param {string} outputPath - Path of the merged PDF to create.
   * @returns {string} `outputPath` when the command succeeded and the file exists.
   * @throws {Error} When the command fails or the output file is missing.
   */
  function pdfUnite(pdfList, outputPath) {
    // Wrap in single quotes; an embedded single quote becomes '\'' .
    const quote = (arg) => "'" + String(arg).replace(/'/g, "'\\''") + "'";
    const command = ["pdfunite", ...[...pdfList, outputPath].map(quote)].join(" ");

    let result;
    try {
      result = shell.exec(command);
    } catch (err) {
      console.error(err);
    }

    // Check the exit code as well as the file: an output left over from an
    // earlier run must not be mistaken for success.
    if (result?.code === 0 && fs.existsSync(outputPath)) {
      return outputPath;
    }
    throw new Error("error: pdfunit merge error");
  }
  /**
   * Fill a DOCX template with `data` using docxtemplater and write the result
   * into the temp directory.
   *
   * Image tags are resolved by the image module: the tag value is read as a
   * local file path and the image is inserted at its own pixel size.
   * Null and undefined values are rendered as empty strings. The caller's
   * `data` object is not modified.
   *
   * @param {string} inputDocxPath - Path of the DOCX template.
   * @param {string} outputDocxName - File name of the rendered document.
   * @param {object} data - Values for the template tags.
   * @param {{tempDir?: string}} [options] - `tempDir` overrides the module's default temp directory.
   * @returns {string} Path of the rendered DOCX file.
   * @throws {Error} When an image referenced by a tag does not exist; errors from reading, rendering or writing also propagate.
   */
  export function renderDocx(inputDocxPath, outputDocxName, data, options) {
    const imageOptions = {
      getImage(tagValue, tagName) {
        if (!fs.existsSync(tagValue)) {
          throw new Error(`Image not found: ${tagValue}`);
        }
        return fs.readFileSync(tagValue);
      },
      getSize(img) {
        const sizeObj = sizeOf(img);
        console.log(sizeObj);
        return [sizeObj.width, sizeObj.height];
      },
    };

    const outputDocxPath = path.join(options?.tempDir || tempDir, outputDocxName);

    // Load the template as binary content and open it as a zip.
    const content = fs.readFileSync(inputDocxPath, "binary");
    const zip = new PizZip(content);
    const doc = new Docxtemplater(zip, {
      paragraphLoop: true,
      linebreaks: true,
      modules: [new ImageModule(imageOptions)],
    });

    // Replace null/undefined with "" on a copy, so the caller's object stays untouched.
    const renderData = Object.fromEntries(
      Object.entries(data ?? {}).map(([key, value]) => [key, value ?? ""])
    );
    doc.render(renderData);

    const buf = doc.getZip().generate({
      type: "nodebuffer",
      // DEFLATE adds a compression step to the generated archive.
      compression: "DEFLATE",
    });
    fs.writeFileSync(outputDocxPath, buf);
    return outputDocxPath;
  }
  /**
   * Replace `{{key}}` placeholders in a DOCX file's `word/document.xml`.
   *
   * The DOCX is unpacked into a scratch directory (named after the MD5 of
   * `outputDocxPath`) inside the temp directory, the placeholders are replaced,
   * and the directory is zipped again to `<temp directory>/<outputDocxPath>`.
   * The scratch directory is removed afterwards, on success and on failure.
   *
   * `options` serves two purposes: every own key is used as a placeholder name
   * with its value as the replacement, and `options.tempDir` (when set) selects
   * the temp directory.
   *
   * NOTE(review): values are inserted into the XML verbatim, without XML
   * escaping - confirm whether callers pass pre-escaped text.
   *
   * @example
   * // Replaces {{name}} and {{age}} in cs.docx and writes dd.docx into the temp directory.
   * await replaceDocx('cs.docx', 'dd.docx', { name: 'Alice', age: '30' })
   *
   * @param {string} inputDocxPath - Path of the source DOCX.
   * @param {string} outputDocxPath - Output file name, resolved inside the temp directory.
   * @param {object} options - Placeholder values, plus optional `tempDir`.
   * @param {{onDocxComplete?: function(string): void}} [eventMap] - `onDocxComplete` is called with the output path once the file is written.
   * @returns {Promise<boolean>} Resolves to `true` when the output file has been written; rejects on any error.
   */
  export async function replaceDocx(inputDocxPath, outputDocxPath, options, eventMap) {
    const workDir = options?.tempDir || tempDir;
    const outmd5 = crypto.createHash('md5').update(outputDocxPath).digest('hex');
    const tempDocxPath = path.join(workDir, outmd5);
    const tempDocxXMLName = path.join(tempDocxPath, `word/document.xml`);
    const outputFilePath = path.join(workDir, outputDocxPath);

    try {
      await compressing.zip.uncompress(inputDocxPath, tempDocxPath);

      let text = (await fs.promises.readFile(tempDocxXMLName)).toString();
      for (const key of Object.keys(options ?? {})) {
        // A replacer function inserts the value literally; a plain string
        // would have "$&", "$$" etc. interpreted as replacement patterns.
        text = text.replaceAll(`{{${key}}}`, () => String(options[key]));
      }
      await fs.promises.writeFile(tempDocxXMLName, text);

      // Zip the unpacked directory back into a DOCX file.
      await new Promise((resolve, reject) => {
        const zipStream = new compressing.zip.Stream();
        for (const entry of fs.readdirSync(tempDocxPath)) {
          zipStream.addEntry(path.join(tempDocxPath, entry));
        }
        const outStream = fs.createWriteStream(outputFilePath);
        outStream.on('close', resolve);
        outStream.on('error', reject);
        // pipe() does not forward source errors, so handle them explicitly.
        zipStream.on('error', (err) => {
          outStream.destroy();
          reject(err);
        });
        zipStream.pipe(outStream);
      });

      // eventMap is optional; the documented example omits it.
      eventMap?.onDocxComplete?.(outputFilePath);
      return true;
    } finally {
      fs.rmSync(tempDocxPath, { recursive: true, force: true });
    }
  }
  473. module.exports.replaceDocx = replaceDocx
  /**
   * Derive a deterministic identifier from a value.
   *
   * The value is converted to a string and hashed with SHA-256; the result is
   * the 64-character lower-case hex digest. Only null and undefined are treated
   * as the empty string, so `0`, `false` and `NaN` each get their own id
   * instead of colliding with a missing input.
   *
   * @param {*} inputString - Value to derive the id from.
   * @returns {string} SHA-256 hex digest of the stringified input.
   */
  function generateObjectId(inputString) {
    return crypto
      .createHash('sha256')
      .update(String(inputString ?? ""))
      .digest('hex');
  }