请参阅: java : pdfbox 读取 PDF文件内书签
npm install elementtree --save
编写 txt_etree_mm.js 如下
// 读目录.txt文件,使用 elementtree 生成思维导图 Freemind(.mm)文件
var fs = require('fs');
var process = require('process');
var path = require('path');
var readline = require('readline');
var et = require('elementtree');
var XML = et.XML;
var ElementTree = et.ElementTree;
var element = et.Element;
var subElement = et.SubElement;
if (process.argv.length <3){
console.error("usage: node txt_etree.mm.js file1.txt");
return 1;
}
var file1 = process.argv[2]
let stat = fs.statSync(file1);
if (!stat.isFile()) {
console.error("it is not File.");
return 2;
}
let ext = path.extname(file1);
if (ext.toLowerCase() != '.txt'){
console.error(ext +" is not .txt");
return 3;
}
var file2 = file1.replace('.txt', '.mm');
console.log(file2);
var fRead = fs.createReadStream(file1);
var fWrite = fs.createWriteStream(file2);
// 创建readline接口实例
var rline = readline.createInterface({
input: fRead,
// output: fWrite,
terminal: true
});
var txt, map1, root, edge, node1, node2, node3, node4, node5;
// 创建 map节点
map1 = element('map');
map1.set('version', '1.0.1');
// 用缩排表现层级关系,假设最多5个层级
// line 事件
var n =1;
rline.on('line', function(line){
txt = line.trim();
if (n ==1){
// 读取第一行:书名
// 创建主题节点
root = subElement(map1, "node");
root.set('ID', '1');
root.set('STYLE', 'bubble'); // 泡框
root.set('TEXT', txt);
// 定义连线的颜色:红色
edge = subElement(root, "edge")
edge.set('COLOR', "#ff0000")
}
txt = txt.slice(0,-3); // 去掉行尾的页数
if (txt.length ==0 || n==1) ;
else if (txt.length >0 && line.slice(0,1) !=' '){
// 创建主题的子节点(1级节点)
node1 = subElement(root, "node");
node1.set('ID', String(n));
node1.set('POSITION', "right");
node1.set('TEXT', txt);
p_node = node1; // 寄存父节点
}
else if (line.startsWith(" ") && line.slice(2,3) !=' '){
// 创建node1的子节点(2级节点)
if (node1) node2 = subElement(node1, "node");
else node2 = subElement(root, "node");
node2.set('ID', String(n));
node2.set('TEXT', txt);
p_node = node2;
}
else if (line.startsWith(" ") && line.slice(4,5) !=' '){
// 创建node2的子节点(3级节点)
if (node2) node3 = subElement(node2, "node");
else if(node1) node3 = subElement(node1, "node");
else node3 = subElement(root, "node");
node3.set('FOLDED', "true");
node3.set('ID', String(n));
node3.set('TEXT', txt);
p_node = node3;
}
else if (line.startsWith(" ") && line.slice(6,7) !=' '){
// 创建node3的子节点(4级节点)
if (node3) node4 = subElement(node3, "node");
else if (node2) node4 = subElement(node2, "node");
else if (node1) node4 = subElement(node1, "node");
else node4 = subElement(root, "node");
node4.set('ID', String(n));
node4.set('TEXT', txt);
p_node = node4;
}
else if (line.startsWith(" ") && line.slice(8,9) !=' '){
// 创建node4的子节点(5级节点)
if (node4) node5 = subElement(node4, "node");
else if (p_node) node5 = subElement(p_node, "node");
else node5 = subElement(root, "node");
node5.set('ID', String(n));
node5.set('TEXT', txt);
}
else {
console.log(txt);
}
n = n+1;
});
var etree, xml;
rline.on('close', function(){
etree = new ElementTree(map1);
xml = etree.write({'xml_declaration': false});
//console.log(xml);
fWrite.write(xml);
});
运行 node txt_etree.mm.js your_pdf_dir.txt