From 22d49fccda65123115a7739f0f24eb4b966ae811 Mon Sep 17 00:00:00 2001 From: Graeme Geldenhuys Date: Fri, 13 Aug 2010 16:57:46 +0200 Subject: minor changes to INF format document --- docview/docs/inf04.txt | 42 +++++++++++++++++++++++++++++++++++------- 1 file changed, 35 insertions(+), 7 deletions(-) (limited to 'docview/docs') diff --git a/docview/docs/inf04.txt b/docview/docs/inf04.txt index 6ad23d9f..ac7cca8d 100644 --- a/docview/docs/inf04.txt +++ b/docview/docs/inf04.txt @@ -51,18 +51,25 @@ -- Marcus Groeber (marcusg@ph-cip.uni-koeln.de - Fidonet 2:243/8605.1) + *** introduction to version 3 *** Just a bit of an update and flesh out ;-) -- Peter Childs (pjchilds@apanix.apana.org.au) + *** Version 4 **** Further additions as found while writing NewView -- Aaron Lawrence + Some more info and corrections while writing fpGUI's DocView + + -- Graeme Geldenhuys + + **** Types **** All numeric quantities are least-significant-byte first in the file @@ -75,6 +82,7 @@ int16 16 bit unsigned integer int32 32 bit unsigned integer + **** The File Header **** Starting at file offset 0 the following structure can overlay the file @@ -98,8 +106,8 @@ int32 tocstrlen; // number of bytes in file occupied by the // table-of-contents entries int32 tocstart; // 32 bit file offset of the start of tocarray - int16 nres; // number of panels with ressource numbers - int32 resstart; // 32 bit file offset of ressource number table + int16 nres; // number of panels with resource numbers + int32 resstart; // 32 bit file offset of resource number table int16 nname; // number of panels with textual name int32 namestart; // 32 bit file offset to panel name table int16 nindex; // number of index entries @@ -122,6 +130,7 @@ char8 title[48]; // ASCII title of database } + **** The table of contents entries **** Beginning at each file offset, tocentrystart[i]: @@ -223,6 +232,7 @@ skip over bytestoskip bytes (after w2) and find the tocslots and title as in the non-extended case. + **** The table of contents array **** Beginning at file offset tocstart, this structure can overlay the @@ -232,6 +242,7 @@ // tocentries (above) } + **** The Slots array **** Beginning at file offset slotsstart (provided by the file header) find @@ -240,6 +251,7 @@ // corresponding to this slot } + **** The Dictionary **** Beginning at file offset dictstart (provided by the file header) and @@ -251,6 +263,7 @@ char8* strings[ndict]; } + **** The Article entries **** Beginning at file offset slots[i] the following structure can overlay @@ -263,6 +276,7 @@ int8 text[ntext]; // encoded text of the article } + **** The Local dictionary **** Beginning at file position localdictpos (for each article) there is an @@ -271,6 +285,7 @@ int16 localwords[nlocaldict]; } + **** The Text **** The text for an article then consists of words obtained by referencing @@ -291,6 +306,7 @@ dictionary. Examples are entered and left with 0xff escape sequences. The variable "spacing" is initially (start of every article slot) TRUE. + **** 0xff escape sequences **** These are used to change fonts, make cross references, enter and leave @@ -456,15 +472,17 @@ The font used in the text is the normal IBM extended character set, including line graphics and some of the characters below 32. - **** The ressource number array **** + + **** The resource number array **** Beginning at file offset resstart, this structure can overlay the file: { - int16 res[nres]; // ressource number of panels + int16 res[nres]; // resource number of panels int16 toc[nres]; // toc entry number of panel } + **** The text name array **** Beginning at file offset namestart, this structure can overlay the @@ -474,6 +492,7 @@ int16 toc[nres]; // toc entry number of panel } + **** The index table **** Beginning at file offset indexstart, a structure like the following @@ -492,11 +511,13 @@ int32 synonyms; // 32 bit file offset to start of synonyms referencing this word } + **** The extended data block **** Not yet decoded. This block has a size of 64 bytes and contains various pointers to font names, names of externel databases etc. + **** The full text search table **** Not yet decoded. This table is supressed when "/S" is specified on @@ -567,17 +588,21 @@ int8 dataType; // 0 = uncompressed 2 = compressed data... - Compression is LZW (Lempel Ziv XX?) + Compression is LZW (Lempel Ziv Welch) } + **** NLS table **** Not yet decoded. This table contains informations specific to the language and codepage the document was prepared in. It seems to contain some bitfields as well that might be used for character classification. -Appendix 1: Some useful translations from IBM Extended ASCII to normal ASCII + +Appendix 1: +----------- +Some useful translations from IBM Extended ASCII to normal ASCII One other transformation I had to make was of the character box characters of the IBM extended ASCII set. These characters appear in strings @@ -610,7 +635,9 @@ Appendix 1: Some useful translations from IBM Extended ASCII to normal ASCII can't tell which from my translation -Appendix 2: Style codes for escCode 0x04 and 0x0D +Appendix 2: +----------- +Style codes for escCode 0x04 and 0x0D escCode 0x04 implements font changes associated with the :hp# IPF source tag. @@ -631,6 +658,7 @@ Appendix 2: Style codes for escCode 0x04 and 0x0D History: +-------- October 22, 1992: version for initial posting (inf01.doc) July 12, 1993: second version (refer to introduction for changes) (inf02.doc) July 18, 1993: added appendices to the second version (inf02a.doc) -- cgit v1.2.3-70-g09d2