(*非目录项*)
$precontent=“Geometric Measure Theory —- An Introduction…..1
Series Preface…….3
Introduction…….5
Acknowledgements…….9
Contents…….11″;
$firstpagenumber=13;
(*pdf导出的目录*)
$contentsall=“从pdf文件把目录内容复制粘贴进来”;
(*处理非标准目录, 我定义了一些规则, 你可以自己添加*)
sametostop[ini_?StringQ,beg_?StringQ,end_?StringQ]:=Module[{i=1,tini=ini,tbeg=beg,tend=end,temp},
While[
tbeg!=tend&& i<= 100,
temp=StringReplace[tbeg,RegularExpression[“[\”\[Bullet]]”]->“.”];
temp=StringReplace[temp,RegularExpression[“[\r\n]\\.\\s*\\.”]->“.”];
temp=StringReplace[temp,RegularExpression[“[a-zA-Z]+\\s*[\r\n][a-zA-Z]+”]->“.”];
temp=StringReplace[temp,“\[CenterDot]”->“.”];
temp=StringReplace[temp,“..”-> “. . “];
temp=StringReplace[temp,RegularExpression[“(\\d\\.)\\s+(\\d)”]->“$1”~~“$2”];
i++;
tend=tbeg;
tbeg=temp;
]
tend]
(*输出为标准的djvu能够识别的格式*)
reformart[sec_?StringQ, con_?StringQ, pgnum_?StringQ] :=
Module[{len = Length[StringCases[sec, “.”]], pref = “(“, suff = “)”,
midd = ” \”” ~~ sec ~~ ” “ ~~ con ~~ “\” \”#” ~~ pgnum ~~ “\””},
Switch[len,
0, pref ~~ midd ~~ suff,
1, pref ~~ midd ~~ suff,
2, pref ~~ midd ~~ suff,
3, pref ~~ midd ~~ suff
]
]
(*最终的目录数据, 可以直接被djvused处理*)
$sectionprecontent=StringCases[$precontent,RegularExpression[“([a-zA-Z]+)\\.+(\\d+)”]:> reformart[“”,“$1”,ToString[ToExpression[“$2”]]]]//ColumnForm
$contentsall=sametostop[$contentsall,$contentsall,“”]//ToString;
$sectionlist=StringCases[
$contentsall,RegularExpression[“(.*?)((\\.\\s*){2,})(\\d+)[\\r\\n]*?”]:> reformart[“”,“$1”,ToString[ToExpression[“$4”]+$firstpagenumber–1]]];
List[“(bookmarks”,$sectionprecontent,$sectionlist,“)”]//Flatten//ColumnForm
发表回复