123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188 |
- { Copyright (C) <2005> <Andrew Haines> chmfilewriter.pas
- This library is free software; you can redistribute it and/or modify it
- under the terms of the GNU Library General Public License as published by
- the Free Software Foundation; either version 2 of the License, or (at your
- option) any later version.
- This program is distributed in the hope that it will be useful, but WITHOUT
- ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- FITNESS FOR A PARTICULAR PURPOSE. See the GNU Library General Public License
- for more details.
- You should have received a copy of the GNU Library General Public License
- along with this library; if not, write to the Free Software Foundation,
- Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
- }
- {
- See the file COPYING.FPC, included in this distribution,
- for details about the copyright.
- }
- unit chmfilewriter;
- {$mode objfpc}{$H+}
- interface
- uses
- Strings, Classes, SysUtils, chmwriter, inifiles, contnrs, chmsitemap, avl_tree,
- {for html scanning } dom,SAX_HTML,dom_html;
- type
- TChmProject = class;
- TChmProjectErrorKind = (chmerror,chmwarning,chmhint,chmnote,chmnone);
- TChmProgressCB = procedure (Project: TChmProject; CurrentFile: String) of object;
- TChmErrorCB = procedure (Project: TChmProject;errorkind:TChmProjectErrorKind;msg:String;detaillevel:integer=0);
- { TChmProject }
- TChmProject = class
- private
- FAutoFollowLinks: Boolean;
- FDefaultFont: String;
- FDefaultPage: String;
- FFiles: TStrings;
- FIndexFileName: String;
- FMakeBinaryTOC: Boolean;
- FMakeBinaryIndex: Boolean;
- FMakeSearchable: Boolean;
- FFileName: String;
- FOnProgress: TChmProgressCB;
- FOnError : TChmErrorCB;
- FOutputFileName: String;
- FTableOfContentsFileName: String;
- FTitle: String;
- FWindows : TObjectList;
- FMergeFiles : TStringlist;
- fDefaultWindow : string;
- fScanHtmlContents : Boolean;
- fOtherFiles : TStrings; // Files found in a scan.
- fAllowedExtensions: TStringList;
- fTotalFileList : TAvlTree;
- fAnchorList : TStringList;
- FSpareString : TStringIndex;
- FBasePath : String; // location of the .hhp file. Needed to resolve relative paths
- FReadmeMessage : String; // readme message
- FToc,
- FIndex : TCHMSiteMap;
- FTocStream,
- FIndexStream : TMemoryStream;
- protected
- function GetData(const DataName: String; out PathInChm: String; out FileName: String; var Stream: TStream): Boolean;
- procedure LastFileAdded(Sender: TObject);
- procedure readIniOptions(keyvaluepairs:tstringlist);
- procedure ScanHtml;
- procedure ScanList(toscan,newfiles:TStrings;recursion:boolean);
- procedure ScanSitemap(sitemap:TChmSiteMap;newfiles:TStrings;recursion:boolean);
- function FileInTotalList(const s:String):boolean;
- function SanitizeURL(const basepath, instring, localpath, localname:string; var outstring:String):Boolean;
- public
- constructor Create; virtual;
- destructor Destroy; override;
- procedure LoadFromFile(AFileName: String); virtual;
- procedure LoadFromhhp (AFileName:String;LeaveInclude:Boolean); virtual;
- procedure SaveToFile(AFileName: String); virtual;
- procedure WriteChm(AOutStream: TStream); virtual;
- procedure ShowUndefinedAnchors;
- function ProjectDir: String;
- procedure LoadSitemaps;
- procedure AddFileWithContext(contextid:integer;filename:ansistring;contextname:ansistring='');
- procedure Error(errorkind:TChmProjectErrorKind;msg:String;detaillevel:integer=0);
- // though stored in the project file, it is only there for the program that uses the unit
- // since we actually write to a stream
- property OutputFileName: String read FOutputFileName write FOutputFileName;
- property FileName: String read FFileName write FFileName;
- property Files: TStrings read FFiles write FFiles; // html files
- property OtherFiles: TStrings read FOtherFiles write FOtherFiles; // other files (.css, img etc)
- property AutoFollowLinks: Boolean read FAutoFollowLinks write FAutoFollowLinks;
- property TableOfContentsFileName: String read FTableOfContentsFileName write FTableOfContentsFileName;
- property MakeBinaryTOC: Boolean read FMakeBinaryTOC write FMakeBinaryTOC;
- property MakeBinaryIndex: Boolean read FMakeBinaryIndex write FMakeBinaryIndex;
- property Title: String read FTitle write FTitle;
- property IndexFileName: String read FIndexFileName write FIndexFileName;
- property MakeSearchable: Boolean read FMakeSearchable write FMakeSearchable;
- property DefaultPage: String read FDefaultPage write FDefaultPage;
- property DefaultFont: String read FDefaultFont write FDefaultFont;
- property Windows :TObjectList read FWindows write FWindows;
- property MergeFiles :TStringlist read FMergeFiles write FMergefiles;
- property OnProgress: TChmProgressCB read FOnProgress write FOnProgress;
- property OnError : TChmErrorCB read FOnError write FOnError;
- property DefaultWindow : String read FDefaultWindow write FDefaultWindow;
- property ScanHtmlContents : Boolean read fScanHtmlContents write fScanHtmlContents;
- property ReadmeMessage : String read FReadmeMessage write FReadmeMessage;
- property AllowedExtensions : TStringList read FAllowedExtensions;
- end;
- TChmContextNode = Class
- URLName : AnsiString;
- ContextNumber : Integer;
- ContextName : AnsiString;
- End;
- Const
- ChmErrorKindText : array[TCHMProjectErrorKind] of string = ('Error','Warning','Hint','Note','');
- implementation
- uses XmlCfg, CHMTypes;
- type
- { TFirstReference }
- TFirstReference = class
- public
- Location: string;
- constructor Create(Const ALocation: string);
- end;
- { TFirstReference }
- constructor TFirstReference.Create(const ALocation: string);
- begin
- Location := ALocation;
- end;
- { TChmProject }
- function TChmProject.GetData(const DataName: String; out PathInChm: String; out
- FileName: String; var Stream: TStream): Boolean;
- begin
- Result := False; // Return true to abort compressing files
- TMemoryStream(Stream).LoadFromFile(ProjectDir+DataName);
- // clean up the filename
- FileName := StringReplace(ExtractFileName(DataName), '\', '/', [rfReplaceAll]);
- FileName := StringReplace(FileName, '//', '/', [rfReplaceAll]);
- PathInChm := '/'+ExtractFilePath(DataName);
- if Assigned(FOnProgress) then FOnProgress(Self, DataName);
- end;
- procedure TChmProject.LastFileAdded(Sender: TObject);
- var
- Writer: TChmWriter;
- begin
- // Assign the TOC and index files
- Writer := TChmWriter(Sender);
- {$ifdef chmindex}
- Writeln('binindex filename ',IndexFileName);
- {$endif}
- if assigned(FIndexStream) then
- begin
- FIndexStream.position:=0;
- Writer.AppendIndex(FIndexStream);
- if MakeBinaryIndex then
- begin
- {$ifdef chmindex}
- Writeln('into binindex ');
- {$endif}
- Writer.AppendBinaryIndexFromSiteMap(FIndex,False);
- end;
- end;
- if assigned(FTocStream) then
- begin
- Writer.AppendTOC(FTOCStream);
- if MakeBinaryTOC then
- begin
- Writer.AppendBinaryTOCFromSiteMap(FToc);
- end;
- end;
- if not assigned(sender) then
- Writer.Free;
- end;
- constructor TChmProject.Create;
- begin
- FFiles := TStringList.Create;
- FOtherFiles := TStringList.Create;
- FAllowedExtensions:=TStringList.Create;
- FAllowedExtensions.add('.HTM');
- FAllowedExtensions.add('.HTML');
- FWindows:=TObjectList.Create(True);
- FMergeFiles:=TStringlist.Create;
- ScanHtmlContents:=False;
- FTotalFileList:=TAvlTree.Create(@CompareStrings);
- FSparestring :=TStringIndex.Create;
- fAnchorList := TStringList.Create;
- fAnchorList.Sorted := True;
- fAnchorList.OwnsObjects := True;
- end;
- destructor TChmProject.Destroy;
- var i : integer;
- begin
- for i:=0 to ffiles.count -1 do
- ffiles.objects[i].free;
- FMergeFiles.Free;
- FFiles.Free;
- FOtherFiles.Free;
- FWindows.Free;
- FSpareString.Free;
- FTotalFileList.FreeAndClear;
- FTotalFileList.Free;
- fAllowedExtensions.Free;
- FToc.free;
- FIndex.free;
- FTocStream.Free;
- FIndexStream.Free;
- fAnchorList.Free;
- inherited Destroy;
- end;
- Type
- TSectionEnum = (secOptions,secWindows,secFiles,secMergeFiles,secAlias,secMap,secInfoTypes,secTextPopups,secUnknown);
- TOptionEnum = (OPTAUTO_INDEX,OPTAUTO_TOC,OPTBINARY_INDEX,OPTBINARY_TOC,OPTCITATION,
- OPTCOMPRESS,OPTCOPYRIGHT,OPTCOMPATIBILITY,OPTCOMPILED_FILE,OPTCONTENTS_FILE,
- OPTCREATE_CHI_FILE,OPTDBCS,OPTDEFAULT_FONT,OPTDEFAULT_WINDOW,OPTDEFAULT_TOPIC,
- OPTDISPLAY_COMPILE_NOTES,OPTDISPLAY_COMPILE_PROGRESS,OPTENHANCED_DECOMPILATION,OPTERROR_LOG_FILE,OPTFLAT,
- OPTFULL_TEXT_SEARCH_STOP_LIST,OPTFULL_TEXT_SEARCH,OPTIGNORE,OPTINDEX_FILE,OPTLANGUAGE,OPTPREFIX,
- OPTSAMPLE_STAGING_PATH,OPTSAMPLE_LIST_FILE,OPTTMPDIR,OPTTITLE,OPTCUSTOM_TAB,OPTUNKNOWN);
- Const
- SectionNames : Array[TSectionEnum] of String =
- ('OPTIONS','WINDOWS','FILES','MERGE FILES','ALIAS','MAP','INFOTYPES','TEXT POPUPS','UNKNOWN');
- OptionKeys : array [TOptionEnum] of String =
- ('AUTO INDEX','AUTO TOC','BINARY INDEX','BINARY TOC','CITATION',
- 'COMPRESS','COPYRIGHT','COMPATIBILITY','COMPILED FILE','CONTENTS FILE',
- 'CREATE CHI FILE','DBCS','DEFAULT FONT','DEFAULT WINDOW','DEFAULT TOPIC',
- 'DISPLAY COMPILE NOTES','DISPLAY COMPILE PROGRESS','ENHANCED DECOMPILATION','ERROR LOG FILE','FLAT',
- 'FULL-TEXT SEARCH STOP LIST','FULL-TEXT SEARCH','IGNORE','INDEX FILE','LANGUAGE','PREFIX',
- 'SAMPLE STAGING PATH','SAMPLE LIST FILE','TMPDIR','TITLE','CUSTOM TAB','UNKNOWN');
- function FindSectionName (const name:string):TSectionEnum;
- begin
- result:=low(TSectionEnum);
- while (result<secUnknown) and (name<>SectionNames[Result]) do
- inc(result);
- end;
- function FindOptionName(Const name:string):TOptionEnum;
- begin
- result:=low(TOptionEnum);
- while (result<optUnknown) and (name<>OptionKeys[Result]) do
- inc(result);
- end;
- procedure TChmProject.readIniOptions(keyvaluepairs:tstringlist);
- var i : integer;
- Opt : TOptionEnum;
- OptVal,
- OptValUpper : string;
- begin
- for i:=0 to keyvaluepairs.count-1 do
- begin
- Opt:=findoptionname(uppercase(keyvaluepairs.names[i]));
- optval :=keyvaluepairs.valuefromindex[i];
- optvalupper:=uppercase(OptVal);
- case Opt Of
- OPTAUTO_INDEX : ;
- OPTAUTO_TOC : ;
- OPTBINARY_INDEX : MakeBinaryIndex:=optvalupper='YES';
- OPTBINARY_TOC : MakeBinaryToc :=optvalupper='YES';
- OPTCITATION : ;
- OPTCOMPRESS : ; // Doesn't seem to have effect in workshop
- OPTCOPYRIGHT : ;
- OPTCOMPATIBILITY : ;
- OPTCOMPILED_FILE : OutputFilename:=optval;
- OPTCONTENTS_FILE : TableOfContentsFileName:=optval;
- OPTCREATE_CHI_FILE : ;
- OPTDBCS : ; // What this field makes unicode is not known?
- OPTDEFAULT_FONT : defaultfont:=optval;
- OPTDEFAULT_WINDOW : defaultwindow:=optval;
- OPTDEFAULT_TOPIC : defaultpage:=optval;
- OPTDISPLAY_COMPILE_NOTES : ;
- OPTDISPLAY_COMPILE_PROGRESS : ;
- OPTENHANCED_DECOMPILATION : ;
- OPTERROR_LOG_FILE : ;
- OPTFLAT : ;
- OPTFULL_TEXT_SEARCH_STOP_LIST: ;
- OPTFULL_TEXT_SEARCH : MakeSearchable:=optvalupper='YES';
- OPTIGNORE : ;
- OPTINDEX_FILE : Indexfilename:=optval;
- OPTLANGUAGE : ;
- OPTPREFIX : ; // doesn't seem to have effect
- OPTSAMPLE_STAGING_PATH : ;
- OPTSAMPLE_LIST_FILE : ;
- OPTTMPDIR : ;
- OPTTITLE : Title:=optval;
- OPTCUSTOM_TAB : ;
- OPTUNKNOWN : ; // can be used for errors on unknown keys
- end;
- end;
- end;
- procedure TChmProject.LoadFromFile(AFileName: String);
- var
- Cfg: TXMLConfig;
- MergeFileCount,
- WinCount,
- FileCount: Integer;
- I : Integer;
- nd : TChmContextNode;
- win: TCHMWindow;
- s : String;
- begin
- Cfg := TXMLConfig.Create(nil);
- Cfg.Filename := AFileName;
- FileName := AFileName;
- FBasePath:=extractfilepath(expandfilename(afilename));
- Files.Clear;
- FileCount := Cfg.GetValue('Files/Count/Value', 0);
- for I := 0 to FileCount-1 do
- begin
- nd:=TChmContextNode.Create;
- nd.urlname:=Cfg.GetValue('Files/FileName'+IntToStr(I)+'/Value','');
- nd.contextnumber:=Cfg.GetValue('Files/FileName'+IntToStr(I)+'/ContextNumber',0);
- nd.contextname:=Cfg.GetValue('Files/FileName'+IntToStr(I)+'/ContextName','');
- Files.AddObject(nd.URLNAME,nd);
- end;
- FileCount := Cfg.GetValue('OtherFiles/Count/Value', 0);
- for I := 0 to FileCount-1 do
- begin
- s:=Cfg.GetValue('OtherFiles/FileName'+IntToStr(I)+'/Value','');
- OtherFiles.Add(s);
- end;
- WinCount:= Cfg.GetValue('Windows/Count/Value', 0);
- for i:=0 To WinCount-1 do
- begin
- win:=TCHMWindow.Create;
- win.loadfromxml(cfg,'Windows/item'+inttostr(i)+'/');
- fwindows.add(win);
- end;
- Mergefilecount:=Cfg.getValue('MergeFiles/Count/Value', 0);
- for i:=0 To MergeFileCount-1 do
- Mergefiles.add(Cfg.getValue('MergeFiles/FileName'+IntToStr(I)+'/value',''));
- // load some values that changed key backwards compatible.
- IndexFileName := Cfg.GetValue('Files/IndexFile/Value','');
- if IndexFileName='' Then
- IndexFileName := Cfg.GetValue('Settings/IndexFile/Value','');
- TableOfContentsFileName := Cfg.GetValue('Files/TOCFile/Value','');
- If TableOfContentsFileName='' then
- TableOfContentsFileName := Cfg.GetValue('Settings/TOCFile/Value','');
- // For chm file merging, bintoc must be false and binindex true. Change defaults in time?
- // OTOH, merging will be mostly done for fpdoc files, and that doesn't care about defaults.
- S:=Cfg.GetValue('Files/MakeBinaryTOC/Value', '');
- if s='' Then
- MakeBinaryTOC := Cfg.GetValue('Settings/MakeBinaryTOC/Value', True)
- else
- MakeBinaryTOC := Cfg.GetValue('Files/MakeBinaryTOC/Value', True);
- S:=Cfg.GetValue('Files/MakeBinaryIndex/Value', '');
- if s='' Then
- MakeBinaryIndex := Cfg.GetValue('Settings/MakeBinaryIndex/Value', False)
- else
- MakeBinaryIndex := Cfg.GetValue('Files/MakeBinaryIndex/Value', False);
- AutoFollowLinks := Cfg.GetValue('Settings/AutoFollowLinks/Value', False);
- MakeSearchable := Cfg.GetValue('Settings/MakeSearchable/Value', False);
- DefaultPage := Cfg.GetValue('Settings/DefaultPage/Value', '');
- Title := Cfg.GetValue('Settings/Title/Value', '');
- OutputFileName := Cfg.GetValue('Settings/OutputFileName/Value', '');
- DefaultFont := Cfg.GetValue('Settings/DefaultFont/Value', '');
- DefaultWindow:= Cfg.GetValue('Settings/DefaultWindow/Value', '');
- ScanHtmlContents:= Cfg.GetValue('Settings/ScanHtmlContents/Value', False);
- Cfg.Free;
- end;
- function cleanupstring(const s:string):string;
- var
- i:integer;
- begin
- i:=pos(';',s);
- if i>0 then
- result:=trim(copy(s,1,i-1))
- else
- result:=trim(s);
- end;
- procedure TChmProject.LoadFromhhp (AFileName:String;LeaveInclude:Boolean);
- // leaveinclude=true leaves includefiles includefiles.
- procedure addalias(const key,value :string);
- var i,j : integer;
- node: TCHMContextNode;
- keyupper,valueupper : string;
- begin
- { Defaults other than global }
- MakeBinaryIndex:=True;
- {$ifdef hhp_debug}
- writeln('alias entry:',key,'=',value);
- {$endif}
- keyupper:=uppercase(value);
- i:=0; j:=files.count;
- while (i<j) and (uppercase(TCHMContextnode(files.objects[i]).UrlName)<>keyupper) do
- inc(i);
- if i=j then
- begin
- {$ifdef hhp_debug}
- writeln('alias new node:',key);
- {$endif}
- node:=TCHMContextNode.create;
- valueupper:=stringReplace(value, '\', '/', [rfReplaceAll]);
- valueupper:= StringReplace(valueupper, '//', '/', [rfReplaceAll]);
- node.URLName:=valueupper;
- node.contextname:=key;
- end
- else
- begin
- node:=TCHMContextNode(Files.objects[i]);
- node.ContextName:=key;
- end;
- end;
- procedure processalias(strs:TStringlist);
- var i,j : integer;
- s : string;
- strls2:tstringlist;
- begin
- for i:=0 to strs.count-1 do
- begin
- s:=cleanupstring(strs[i]);
- if uppercase(copy(s,1,8))='#INCLUDE' then
- begin
- delete(s,1,8);
- s:=trim(s);
- if fileexists(s) then
- begin
- strls2:=TstringList.create;
- strls2.loadfromfile(s);
- processalias(strls2);
- strls2.free;
- end;
- end
- else
- begin
- s:=cleanupstring(s);
- j:=pos('=',s);
- if j>0 then
- addalias(trim(copy(s,1,j-1)),copy(s,j+1,length(s)-j));
- end;
- end;
- end;
- procedure addmap(const key,value :string);
- var i,j : integer;
- node: TCHMContextNode;
- keyupper : string;
- begin
- {$ifdef hhp_debug}
- writeln('map entry:',key,'=',value);
- {$endif}
- keyupper:=uppercase(key);
- i:=0; j:=files.count;
- while (i<j) and (uppercase(TCHMContextnode(files.objects[i]).contextname)<>keyupper) do
- inc(i);
- if i=j then
- raise Exception.create('context "'+key+'" not found!')
- else
- begin
- node:=TCHMContextNode(Files.objects[i]);
- node.Contextnumber:=strtointdef(value,0);
- end;
- end;
- procedure processmap(strs:TStringlist);
- var i,j : integer;
- s : string;
- strls2:tstringlist;
- begin
- for i:=0 to strs.count-1 do
- begin
- s:=cleanupstring(strs[i]);
- {$ifdef hhp_debug}
- writeln('map item:',s);
- {$endif}
- if uppercase(copy(s,1,8))='#INCLUDE' then
- begin
- delete(s,1,8);
- s:=trim(s);
- if fileexists(s) then
- begin
- strls2:=TstringList.create;
- strls2.loadfromfile(s);
- processmap(strls2);
- strls2.free;
- end;
- end
- else
- begin
- s:=cleanupstring(s);
- if uppercase(copy(s,1,7))='#DEFINE' Then
- begin
- delete(s,1,7);
- s:=trim(s);
- j:=pos(' ',s);
- if j>0 then
- addmap(trim(copy(s,1,j-1)),copy(s,j+1,length(s)-j));
- end
- else
- begin
- {$ifdef hhp_debug}
- writeln('map leftover:',s);
- {$endif}
- end;
- end;
- end;
- end;
- var
- Fini : TMemIniFile; // TMemInifile is more compatible with Delphi. Delphi's API based TIniFile fails on .hhp files.
- secs,strs : TStringList;
- i,j : Integer;
- section : TSectionEnum;
- nd : TChmContextNode;
- begin
- { Defaults other than global }
- MakeBinaryIndex:=True;
- FBasePath:=extractfilepath(expandfilename(afilename));
- Fini:=TMeminiFile.Create(AFileName);
- secs := TStringList.create;
- strs := TStringList.create;
- fini.readsections(secs);
- // Do the files section first so that we can emit errors if
- // other sections reference unknown files.
- fini.readsectionvalues(SectionNames[secFiles] ,strs);
- if strs.count>0 then
- for j:=0 to strs.count-1 do
- begin
- nd:=TChmContextNode.Create;
- nd.urlname:=StringReplace(strs[j],'\', '/', [rfReplaceAll]);
- nd.contextnumber:=0;
- nd.contextname:='';
- Files.AddObject(nd.urlname,nd);
- end;
- // aliases also add file nodes.
- fini.readsectionvalues(SectionNames[secAlias] ,strs); // resolve all aliases.
- if strs.count>0 then
- processalias(strs);
- // map files only add to existing file nodes.
- fini.readsectionvalues(SectionNames[secmap] ,strs);
- if strs.count>0 then
- processmap(strs);
- for i:=0 to secs.count-1 do
- begin
- section:=FindSectionName(Uppercase(Secs[i]));
- if section<>secunknown then
- fini.readsectionvalues(secs[i] ,strs);
- case section of
- secOptions : readinioptions(strs);
- secWindows : for j:=0 to strs.count-1 do
- FWindows.add(TCHMWindow.Create(strs[j]));
- secFiles : ; // already done
- secMergeFiles: FMergeFiles.Assign(Strs); // just a filelist
- secAlias : ; // already done
- secMap : ; // already done
- secInfoTypes : ; // unused for now.
- secTextPopups: ; // rarely used.
- end;
- end;
- secs.free;
- strs.free;
- fini.free;
- ScanHtmlContents:=true;
- end;
- procedure TChmProject.AddFileWithContext(contextid:integer;filename:ansistring;contextname:ansistring='');
- var x : integer;
- nd : TChmContextNode;
- begin
- x:=files.indexof(filename);
- if x=-1 then
- begin
- nd:=TChmContextNode.Create;
- nd.urlname:=filename;
- nd.contextnumber:=contextid;
- nd.contextname:=contextname;
- Files.AddObject(nd.urlname,nd);
- end
- else
- begin
- nd:=TChmContextNode(files.objects[x]);
- if not assigned(nd) then
- begin
- nd:=TChmContextNode.Create;
- nd.urlname:=filename;
- files.objects[x]:=nd;
- end;
- nd.contextnumber:=contextid;
- nd.contextname:=contextname;
- end;
- end;
- procedure TChmProject.SaveToFile(AFileName: String);
- var
- Cfg: TXMLConfig;
- I : Integer;
- nd : TChmContextNode;
- begin
- Cfg := TXMLConfig.Create(nil);
- Cfg.StartEmpty := True;
- Cfg.Filename := AFileName;
- Cfg.Clear;
- Cfg.SetValue('Files/Count/Value', Files.Count);
- for I := 0 to Files.Count-1 do
- begin
- nd:=TChmContextNode(files.objects[i]);
- Cfg.SetValue('Files/FileName'+IntToStr(I)+'/Value', Files.Strings[I]);
- if assigned(nd) then
- begin
- Cfg.SetValue('Files/FileName'+IntToStr(I)+'/ContextNumber', nd.contextnumber);
- Cfg.SetValue('Files/FileName'+IntToStr(I)+'/ContextName', nd.contextname);
- end;
- end;
- Cfg.SetValue('OtherFiles/Count/Value', OtherFiles.Count);
- for I := 0 to OtherFiles.Count-1 do
- Cfg.SetValue('OtherFiles/FileName'+IntToStr(I)+'/Value', OtherFiles.Strings[I]);
- Cfg.SetValue('Windows/Count/Value', FWindows.count);
- for i:=0 To FWindows.Count-1 do
- TCHMWindow(FWindows[i]).savetoxml(cfg,'Windows/item'+inttostr(i)+'/');
- Cfg.SetValue('MergeFiles/Count/Value', FMergeFiles.count);
- for i:=0 To FMergeFiles.Count-1 do
- Cfg.SetValue('MergeFiles/FileName'+IntToStr(I)+'/value',FMergeFiles[i]);
- // delete legacy keys.
- Cfg.DeleteValue('Files/IndexFile/Value');
- Cfg.DeleteValue('Files/TOCFile/Value');
- Cfg.DeleteValue('Files/MakeBinaryTOC/Value');
- Cfg.DeleteValue('Files/MakeBinaryIndex/Value');
- Cfg.SetValue('Settings/IndexFile/Value', IndexFileName);
- Cfg.SetValue('Settings/TOCFile/Value', TableOfContentsFileName);
- Cfg.SetValue('Settings/MakeBinaryTOC/Value',MakeBinaryTOC);
- Cfg.SetValue('Settings/MakeBinaryIndex/Value',MakeBinaryIndex);
- Cfg.SetValue('Settings/AutoFollowLinks/Value', AutoFollowLinks);
- Cfg.SetValue('Settings/MakeSearchable/Value', MakeSearchable);
- Cfg.SetValue('Settings/DefaultPage/Value', DefaultPage);
- Cfg.SetValue('Settings/Title/Value', Title);
- Cfg.SetValue('Settings/OutputFileName/Value', OutputFileName);
- Cfg.SetValue('Settings/DefaultFont/Value', DefaultFont);
- Cfg.SetValue('Settings/DefaultWindow/Value', DefaultWindow);
- Cfg.SetValue('Settings/ScanHtmlContents/Value', ScanHtmlContents);
- Cfg.Flush;
- Cfg.Free;
- end;
- function TChmProject.ProjectDir: String;
- begin
- Result := ExtractFilePath(FileName);
- end;
- procedure TChmProject.Error(errorkind:TChmProjectErrorKind;msg:String;detaillevel:integer=0);
- begin
- if assigned(OnError) then
- OnError(self,errorkind,msg,detaillevel);
- end;
- const
- protocols : array[0..3] of string = ('HTTP:','FTP:','MS-ITS:', 'MAILTO:');
- protocollen : array[0..3] of integer= ( 5 ,4 ,7, 7);
- function TChmProject.SanitizeURL(const basepath,instring,localpath,localname:string;var outstring:String):Boolean;
- var i,j,len : integer;
- Anchor: String;
- begin
- result:=true; outstring:='';
- if instring='' then
- exit(false);
- len:=length(instring);
- if len=0 then
- exit(false);
- { Check for protocols before adding local path }
- i:=0;
- while (i<=high(protocols)) do
- begin
- if strlicomp(@protocols[i][1],@instring[1],protocollen[i])=0 then
- exit(false);
- inc(i);
- end;
- outstring:=localpath+instring;
- i:=pos('#',outstring);
- if i<>0 then begin
- if i > 1 then
- Anchor := outstring
- else
- Anchor := localname+outstring;
- j := fAnchorList.IndexOf(Anchor);
- if j < 0 then begin
- fAnchorList.AddObject(Anchor,TFirstReference.Create(localname));
- Anchor := '(new) '+Anchor;
- end;
- Error(CHMNote, 'Anchor found '+Anchor+' while scanning '+localname,1);
- delete(outstring,i,length(outstring)-i+1);
- end;
- outstring:=expandfilename(StringReplace(outstring,'%20',' ',[rfReplaceAll]));// expandfilename(instring));
- outstring:=extractrelativepath(basepath,outstring);
- outstring:=StringReplace(outstring,'\','/',[rfReplaceAll]);
- end;
- function TChmProject.FileInTotalList(const s:String):boolean;
- begin
- FSpareString.TheString:=S;
- result:=assigned(fTotalFileList.FindKey(FSpareString,@CompareStrings));
- end;
- procedure TChmProject.ScanList(toscan,newfiles:TStrings;recursion:boolean);
- // toscan, list to search for htmlfiles to scan.
- // newfiles, the resulting list of files.
- // totalfilelist, the list that contains all found and specified files to check against.
- // localfilelist (local var), files found in this file.
- var
- localpath : string;
- function findattribute(node:TDomNode;attributename:string):String;
- var
- Attributes: TDOMNamedNodeMap;
- atnode : TDomNode;
- n : integer;
- begin
- Result := '';
- if assigned(node) then
- begin
- Attributes:=node.Attributes;
- if assigned(attributes) then
- for n:=0 to attributes.length-1 do
- begin
- atnode :=attributes[n];
- if assigned(atnode) and (uppercase(atnode.nodename)=attributename) then
- exit(atnode.nodevalue);
- end;
- end;
- end;
- procedure checkattributes(node:TDomNode;attributename:string; const localname: string; filelist :TStringList);
- var
- fn : String;
- val : String;
- begin
- val := findattribute(node,attributename);
- if sanitizeurl(fbasepath,val,localpath,localname,fn) then
- if (Length(fn) > 0) { Skip links to self using named anchors }
- and not FileInTotalList(uppercase(fn)) then
- filelist.add(fn);
- end;
- function scantags(prnt:TDomNode; const localname: string; filelist:TStringlist):TDomNode;
- // Seach first matching tag in siblings
- var chld: TDomNode;
- s : ansistring;
- i : Integer;
- begin
- result:=nil;
- if assigned(prnt ) then
- begin
- chld:=prnt.firstchild;
- while assigned(chld) do
- begin
- scantags(chld, localname, filelist); // depth first.
- if (chld is TDomElement) then
- begin
- s:=uppercase(tdomelement(chld).tagname);
- if s='LINK' then
- begin
- //printattributes(chld,'');
- checkattributes(chld,'HREF',localname,filelist);
- end;
- if s='IMG'then
- begin
- //printattributes(chld,'');
- checkattributes(chld,'SRC',localname,filelist);
- end;
- if s='A'then
- begin
- //printattributes(chld,'');
- checkattributes(chld,'HREF',localname,filelist);
- s := findattribute(chld,'NAME');
- if s <> '' then
- begin
- i := fAnchorList.IndexOf(localname+'#'+s);
- if i < 0 then begin
- fAnchorList.Add(localname+'#'+s);
- Error(ChmNote,'New Anchor with name '+s+' found while scanning '+localname,1);
- end else if fAnchorList.Objects[i] = nil then
- Error(chmwarning,'Duplicate anchor definitions with name '+s+' found while scanning '+localname,1)
- else begin
- fAnchorList.Objects[i].Free;
- fAnchorList.Objects[i] := nil;
- Error(ChmNote,'Anchor with name '+s+' defined while scanning '+localname,1);
- end;
- end;
- end;
- end;
- chld:=chld.nextsibling;
- end;
- end;
- end;
- var
- localfilelist: TStringList;
- domdoc : THTMLDocument;
- i,j : Integer;
- fn,s : string;
- ext : String;
- tmplst : Tstringlist;
- strrec : TStringIndex;
- //localpath : string;
- function trypath(const vn:string):boolean;
- var vn2: String;
- strrec : TStringIndex;
- begin
- vn2:=uppercase(vn);
- if FileInTotalList(vn2) then
- begin
- Error(ChmNote,'Found duplicate file '+vn+' while scanning '+fn,1);
- exit(true);
- end;
- result:=false;
- if fileexists(vn) then // correct for relative path .html file?
- begin
- result:=true;
- StrRec:=TStringIndex.Create;
- StrRec.TheString:=vn2;
- StrRec.Strid :=0;
- fTotalFileList.Add(StrRec);
- newfiles.add(vn);
- Error(ChmNote,'Found file '+vn+' while scanning '+fn,1);
- end;
- end;
- begin
- localfilelist:=TStringList.Create;
- for j:=0 to toscan.count-1 do
- begin
- fn:=toscan[j];
- localfilelist.clear;
- if (FAllowedExtensions.Indexof(uppercase(extractfileext(fn)))<>-1) then
- begin
- if fileexists(fn) then
- begin
- domdoc:=THtmlDocument.Create;
- try
- Error(chmnote,'Scanning file '+fn+'.',5);
- ReadHtmlFile(domdoc,fn);
- localpath:=extractfilepath(fn);
- if (length(localpath)>0) and not (localpath[length(localpath)] in ['/','\']) then
- localpath:=localpath+pathsep;
- scantags(domdoc,extractfilename(fn),localfilelist);
- for i:=0 to localFilelist.count-1 do
- begin
- s:=localfilelist[i];
- if not trypath(s) then
- // if not trypath(localpath+s) then
- Error(ChmWarning,'Found file '+s+' while scanning '+fn+', but couldn''t find it on disk',2);
- end;
- except
- on e:exception do
- Error(ChmError,'Html parsing '+fn+', failed. Please submit a bug.');
- end;
- domdoc.free;
- end
- else
- begin
- Error(chmnote,'Can''t find file '+fn+' to scan it.',5);
- end;
- end
- else
- Error(chmnote,'Not scanning file because of unknown extension '+fn,5);
- end;
- localfilelist.free;
- if (newfiles.count>0) and recursion then
- begin
- tmplst:=TStringList.Create;
- scanlist(newfiles,tmplst,true);
- newfiles.addstrings(tmplst);
- tmplst.free;
- end;
- end;
- procedure TChmProject.ScanSitemap(sitemap:TChmSiteMap;newfiles:TStrings;recursion:boolean);
- procedure scanitems(it:TChmSiteMapItems);
- var i : integer;
- x : TChmSiteMapItem;
- s : string;
- strrec : TStringIndex;
- begin
- for i:=0 to it.count -1 do
- begin
- x:=it.item[i];
- if sanitizeurl(fbasepath,x.local,'','Site Map for '+x.Text,S) then // sanitize, remove stuff etc.
- begin
- if not FileInTotalList(uppercase(s)) then
- begin
- if fileexists(s) then
- begin
- Error(chmnote,'Good url: '+s+'.',5);
- StrRec:=TStringIndex.Create;
- StrRec.TheString:=uppercase(s);
- StrRec.Strid :=0;
- fTotalFileList.Add(StrRec);
- newfiles.add(s);
- end
- else
- Error(chmnote,'duplicate url: '+s+'.',5);
- end
- else
- Error(chmnote,'duplicate url: '+s+'.',5);
- end
- else
- Error(chmnote,'Bad url: '+s+'.',5);
- if assigned(x.children) and (x.children.count>0) then
- scanitems(x.children);
- end;
- end;
- var i : integer;
- localfilelist: TStringList;
- begin
- localfilelist:=TStringList.Create;
- scanitems(sitemap.items);
- scanlist(newfiles,localfilelist,true);
- newfiles.addstrings(localfilelist);
- localfilelist.free;
- end;
- procedure TChmProject.ScanHtml;
- var
- helplist,
- localfilelist: TStringList;
- i : integer;
- strrec : TStringIndex;
- begin
- for i:=0 to otherfiles.count-1 do
- begin
- StrRec:=TStringIndex.Create;
- StrRec.TheString:=uppercase(otherfiles[i]);
- StrRec.Strid :=0;
- fTotalFileList.Add(StrRec);
- end;
- for i:=0 to files.count-1 do
- begin
- StrRec:=TStringIndex.Create;
- StrRec.TheString:=uppercase(files[i]);
- StrRec.Strid :=0;
- fTotalFileList.Add(StrRec);
- end;
- localfilelist:= TStringList.create;
- scanlist(ffiles,localfilelist,true);
- otherfiles.addstrings(localfilelist);
- localfilelist.clear;
- if (FDefaultpage<>'') and (not FileInTotalList(uppercase(fdefaultpage))) then
- begin
- Error(chmnote,'Scanning default file : '+fdefaultpage+'.',3);
- helplist:=TStringlist.Create;
- helplist.add(fdefaultpage);
- scanlist(helplist,localfilelist,true);
- otherfiles.addstrings(localfilelist);
- localfilelist.clear;
- end;
- if assigned(FToc) then
- begin
- Error(chmnote,'Scanning TOC file : '+FTableOfContentsFileName+'.',3);
- try
- scansitemap(ftoc,localfilelist,true);
- otherfiles.addstrings(localfilelist);
- except
- on e: Exception do
- error(chmerror,'Error scanning TOC file ('+FTableOfContentsFileName+')');
- end;
- end;
- LocalFileList.clear;
- if assigned(FIndex) then
- begin
- Error(chmnote,'Scanning Index file : '+FIndexFileName+'.',3);
- try
- scansitemap(FIndex,localfilelist,true);
- otherfiles.addstrings(localfilelist);
- except
- on e: Exception do
- error(chmerror,'Error scanning index file ('+FIndexFileName+')');
- end;
- end;
- localfilelist.free;
- end;
- procedure TChmProject.WriteChm(AOutStream: TStream);
- var
- Writer : TChmWriter;
- TOCStream,
- IndexStream: TFileStream;
- nd : TChmContextNode;
- I : Integer;
- begin
- LoadSiteMaps;
- // Scan html for "rest" files.
- If ScanHtmlContents Then
- ScanHtml; // Since this is slowing we opt to skip this step, and only do this on html load.
- IndexStream := nil;
- TOCStream := nil;
- Writer := TChmWriter.Create(AOutStream, False);
- // our callback to get data
- Writer.OnGetFileData := @GetData;
- Writer.OnLastFile := @LastFileAdded;
- // give it the list of html files
- Writer.FilesToCompress.AddStrings(Files);
- // give it the list of other files
- Writer.FilesToCompress.AddStrings(OtherFiles);
- // now some settings in the chm
- Writer.DefaultPage := DefaultPage;
- Writer.Title := Title;
- Writer.DefaultFont := DefaultFont;
- Writer.FullTextSearch := MakeSearchable;
- Writer.HasBinaryTOC := MakeBinaryTOC;
- Writer.HasBinaryIndex := MakeBinaryIndex;
- Writer.IndexName := ExtractFileName(IndexFileName);
- Writer.TocName := ExtractFileName(TableOfContentsFileName);
- Writer.ReadmeMessage := ReadmeMessage;
- Writer.DefaultWindow := FDefaultWindow;
- for i:=0 to files.count-1 do
- begin
- nd:=TChmContextNode(files.objects[i]);
- if not fileexists(files[i]) then
- Error(chmWarning,'File '+Files[i]+' does not exist');
- if assigned(nd) and (nd.contextnumber<>0) then
- Writer.AddContext(nd.ContextNumber,files[i]);
- end;
- if FWIndows.Count>0 then
- Writer.Windows:=FWIndows;
- if FMergeFiles.Count>0 then
- Writer.Mergefiles:=FMergeFiles;
- if assigned(ftoc) then
- Writer.TocSitemap:=ftoc;
- // and write!
- Error(chmnone,'Writing CHM '+OutputFileName,0);
- Writer.Execute;
- if Assigned(TOCStream) then TOCStream.Free;
- if Assigned(IndexStream) then IndexStream.Free;
- Writer.Free;
- end;
- procedure TChmProject.ShowUndefinedAnchors;
- var
- i:Integer;
- begin
- for i := 0 to fAnchorList.Count-1 do
- if fAnchorList.Objects[i] <> nil then
- Error(chmerror,'Anchor '+fAnchorList[i]+' undefined; first use '+TFirstReference(fAnchorList.Objects[i]).Location);
- end;
- procedure TChmProject.LoadSitemaps;
- // #IDXHDR (merged files) goes into the system file, and need to keep TOC sitemap around
- begin
- if FTableOfContentsFileName<>'' then
- begin
- if fileexists(FTableOfContentsFileName) then
- begin
- FTocStream:=TMemoryStream.Create;
- try
- FTocStream.loadfromfile(FTableOfContentsFilename);
- writeln(ftableofcontentsfilename, ' ' ,ftocstream.size);
- FTocStream.Position:=0;
- FToc:=TChmSiteMap.Create(sttoc);
- FToc.loadfromstream(FTocStream);
- ftoc.savetofile('bla.something');
- except
- on e:exception do
- begin
- error(chmerror,'Error loading TOC file '+FTableOfContentsFileName);
- freeandnil(ftoc); freeandnil(FTocStream);
- end;
- end;
- end
- else
- error(chmerror,'Can''t find TOC file'+FTableOfContentsFileName);
- end;
- if FIndexFileName<>'' then
- begin
- if fileexists(FIndexFileName) then
- begin
- FIndexStream:=TMemoryStream.Create;
- try
- FIndexStream.LoadFromFile(FIndexFileName);
- FIndexStream.Position:=0;
- FIndex:=TChmSiteMap.Create(stindex);
- FIndex.loadfromfile(FIndexFileName);
- except
- on e: Exception do
- begin
- error(chmerror,'Error loading index file '+FIndexFileName);
- freeandnil(findex); freeandnil(findexstream);
- end;
- end;
- end
- else
- error(chmerror,'Can''t find index file '+FIndexFileName);
- end;
- end;
- end.
|