ref: 47ec5de29e56c4cf223e0582b930b88ca2a589ee
dir: /sys/src/cmd/gs/lib/dumphint.ps/
% Copyright (C) 2000, 2001 Aladdin Enterprises. All rights reserved. % % This software is provided AS-IS with no warranty, either express or % implied. % % This software is distributed under license and may not be copied, % modified or distributed except as expressly authorized under the terms % of the license contained in the file LICENSE in this distribution. % % For more information about licensing, please refer to % http://www.ghostscript.com/licensing/. For information on % commercial licensing, go to http://www.artifex.com/licensing/ or % contact Artifex Software, Inc., 101 Lucas Valley Road #110, % San Rafael, CA 94903, U.S.A., +1(415)492-9861. % $Id: dumphint.ps,v 1.2 2004/04/08 16:18:25 giles Exp $ % Linearized PDF hint formatting utility. % % Linearized PDF hints generated by Acrobat suite seem to deviate from % the published specification. % % /P (page offset hint table) key in hint stream is not generated by % Adobe products. The key is no longer required in PDF 1.5. % % Per-page items 4 and 5 of the page offset hint table start from 1st % page rather than 2nd page as the spec claims. % % All array entries start from the new byte boundary. % /table_width 79 def /col1_width 66 def % Skip bits to the next byte boundary /bytealign { % <stream> bytealign - begin /N 0 def /B 0 def end } bind def % Set bit stream position and align it to byte boundary /set_align { % <<>> pos set_align - exch begin S exch setfileposition /N 0 def /B 0 def end } bind def % Read requested number of bits from the bit stream. /bitread { % <bstream> <width> bitwrite <value> exch begin 0 % bit val { 1 index N .min % bit val m dup 3 1 roll % bit m val m bitshift % bit m val<<m B 2 index N sub % bit m val<<m B m-N bitshift add % bit m val<<m+B>>(N-m) 3 -1 roll % m val' bit 2 index sub % m val' bit' 3 -1 roll % val' bit' m N exch sub dup % val' bit' N' N' 1 exch bitshift % val' bit' N' 1<<N' 1 sub B and % val' bit' N' B&(1<<N') /B exch def % val' bit' N' /N exch def % val' bit' dup 0 le { pop exit % val' } if /N N 8 add def /B B 8 bitshift S read not { 0 ( *** EOF! *** ) = } if add def exch } loop % bit' val' end } bind def % Print a string several times /multiprint { % cnt (s) multiprint - exch { dup print } repeat pop } bind def % Split the line into 2 substrings. /split_line { % (s) split_line () () dup length col1_width gt { col1_width 1 sub dup -1 0 { dup % (s) w i i 3 index % (s) w i i () exch get % (s) w i c 32 eq { exch pop exit } if pop } for 1 add % (s) w' 1 index exch % (s) (s) w' 0 exch % (s) (s) 0 w' getinterval % (s) (v) } { dup % (s) (s) } ifelse (\n) search { 4 1 roll % (pre) (s) (post) (match) pop pop % (pre) (s) 1 index length % (pre) (s) len 1 add % (pre) (s) len+1 } { exch % (pre) (s) 1 index length % (pre) (s) len } ifelse 1 index length % (pre) (s) len Len 1 index sub % (pre) (s) len Len-len getinterval % (pre) (post) } bind def % Print a 2 column table. The string is printed in 1st column % left-aligned. The number is printed in 2nd column right-aligned. /two_column { % n () two_column - split_line % n (a) () 3 1 roll % () n (a) dup length % () n (a) len exch print % () n len exch =string cvs % () len (n) dup length % () len (n) len2 3 -1 roll add % () (n) len+len2 //table_width % () (n) len+len2 78 exch sub % () (n) 78-len+len2 ( ) multiprint % () (n) = % () { dup length 0 eq { exit } if split_line exch = } loop pop () = } bind def % Print the header of a hint table /table_header { % () table_header - dup length dup table_width exch sub 2 idiv % () len sp dup ( ) multiprint % () len sp 3 -1 roll = % len sp ( ) multiprint % len (=) multiprint ()= ()= } bind def % Pretty-print an array on top level /dump_array { % [ ] dump_array - ([) = ( ) print 1 exch { =string cvs % pos () dup length dup % pos () len len 3 index add 1 add % pos () len len+pos+1 table_width gt { () = ( ) print % pos () len 2 add % pos () pos' 3 1 roll print pop % pos' } { ( ) print % pos () len exch print % pos len add 1 add % pos' } ifelse } forall pop () = (]) = } bind def % Pretty-print an array on 2nd level /dump_array2 { % [ ] dump_array2 - ( [) print 3 exch { =string cvs % pos () dup length dup % pos () len len 3 index add 1 add % pos () len len+pos+1 table_width 2 sub gt { () = ( ) print % pos () len 4 add % pos () pos' 3 1 roll print pop % pos' } { ( ) print % pos () len exch print % pos len add 1 add % pos' } ifelse } forall pop ( ]) = } bind def % Print an array header /array_header { () = = } bind def % Analyze the page offset hint table. /dump_page_offset_table { % - dump_page_offset_table - hint_stream dup 32 bitread dup /hint_minnop exch def (1. The least number of objects in a page.) two_column dup 32 bitread dup /hint_1st_obj exch def (2. Location of the first page's page object.) two_column dup 16 bitread dup /hint_maxnopbits exch def (3. Bits for difference between max and min number of page objects.) two_column dup 32 bitread dup /hint_minpl exch def (4. Least length of a page.) two_column dup 16 bitread dup /hint_maxplbits exch def (5. Bits for difference between max and min length of a page.) two_column dup 32 bitread dup /hint_minsco exch def (6. Least start of Contents offset. ) 1 index 0 ne { (\n*** Acrobat expects 0 ***) concatstrings } if two_column dup 16 bitread dup /hint_maxscobits exch def (7. Bits for difference between max and min offset to the start of the content stream.) two_column dup 32 bitread dup /hint_mincl exch def (8. Least contents length.) two_column dup 16 bitread dup /hint_maxclbits exch def (9. Bits needed to represent the greatest Contents length.) two_column dup 16 bitread dup /hint_maxsorbits exch def (10. Bits needed to represent the greatest number of Shared Object references.) two_column dup 16 bitread dup /hint_sobits exch def (11. Bits needed to identify a Shared Object.) two_column dup 16 bitread dup /hint_numfbits exch def (12. Bits needed to represent numerator of fraction.) two_column dup 16 bitread dup /hint_denf exch def (13. Denominator of fraction.) two_column pop LinearizationParams /N get % 1. Number of objects in the page. hint_stream bytealign /hint_page_obj [ 2 index { hint_stream hint_maxnopbits bitread hint_minnop add } repeat ] readonly def (1. Number of objects on the page) array_header hint_page_obj dump_array % 2, Page length in bytes. hint_stream bytealign /hint_page_len [ 2 index { hint_stream hint_maxplbits bitread hint_minpl add } repeat ] readonly def (2. Page length in bytes.) array_header hint_page_len dump_array % 3, Number of shared objects referenced from the page hint_stream bytealign /hint_page_sobj [ 2 index { hint_stream hint_maxsorbits bitread } repeat ] readonly def (3. Number of shared objects referenced from the page.) array_header hint_page_sobj dump_array % 4. Index into the shared objects hint table hint_stream bytealign /hint_page_sobj_id [ 0 1 4 index 1 sub { hint_page_sobj exch get [ exch { hint_stream hint_sobits bitread } repeat ] readonly } for ] readonly def (4. Index into the shared objects hint table.) array_header ([) = hint_page_sobj_id { dump_array2 } forall (])= % 5. Fractional position for each shared object reference hint_stream bytealign /hint_page_sobj_pos [ 0 1 4 index 1 sub { hint_page_sobj exch get [ exch { hint_stream hint_numfbits bitread hint_denf div } repeat ] readonly } for ] readonly def (5. Fractional position for each shared object reference. ) array_header ([)= hint_page_sobj_pos { dump_array2 } forall (])= % 6. Offset of the page's content stream from the beginning of the page. hint_stream bytealign /hint_page_content_offset [ 2 index { hint_stream hint_maxscobits bitread hint_minsco add } repeat ] readonly def (6. Offset of the page's content stream from the beginning of the page.) array_header hint_page_content_offset dump_array % 7. Length of the page's content stream in bytes. hint_stream bytealign /hint_page_content_len [ 2 index { hint_stream hint_maxclbits bitread hint_mincl add } repeat ] readonly def (7. Length of the page's content stream in bytes.) array_header hint_page_content_len dump_array pop } bind def % Analyze tha shared object hint table /dump_shared_object_table { hint_stream dup 32 bitread dup /shint_1st_obj_id exch def (1. Object number of the first object in the shared objects section) two_column dup 32 bitread dup /shint_1st_obj_pos exch def (2. Location of the first object in the shared objects section.) two_column dup 32 bitread dup /shint_1st_shared exch def (3. The number of shared object entries for the first page.) two_column dup 32 bitread dup /shint_all_shared exch def (4. Number of shared object entries for the shared objects section including 1st page.) two_column dup 16 bitread dup /shint_group_bits exch def (5. Number of bits needed to represent the greatest number of objects in a shared object group.) two_column dup 32 bitread dup /shint_group_least_sz exch def (6. Least length of a shared object group in bytes.) two_column dup 16 bitread dup /shint_group_diff_bits exch def (7. Bits for the difference between the greatest and least length of a shared object group size.) two_column pop (1. length of the object group in bytes.) array_header hint_stream bytealign /shint_group_sz [ shint_all_shared { hint_stream shint_group_diff_bits bitread shint_group_least_sz add } repeat ] readonly def shint_group_sz dump_array (2. MD5 signature flag) array_header hint_stream bytealign /shint_md5_flags [ shint_all_shared { hint_stream 1 bitread } repeat ] readonly def shint_md5_flags dump_array (3. MD5 signature string) array_header false shint_md5_flags { 0 ne or } forall { shint_md5_flags { 0 eq { (<>)= } { hint_stream /S get 128 string readstring pop dup length 128 eq { == } { pop (Error reading nd5 string.) == } ifelse } ifelse } forall } { () = (none) = } ifelse (4. The number of objects in the group.) array_header hint_stream bytealign /shint_group_cnt [ shint_all_shared { hint_stream shint_group_bits bitread } repeat ] readonly def shint_group_cnt dump_array } bind def % Analyze the thumbnail hint table. /dump_thumbnail_table { hint_stream dup 32 bitread dup /thint_1st_obj_id exch def (1. Object number of the first thumbnail image.) two_column dup 32 bitread dup /thint_1st_obj_pos exch def (2. Location of the first thumbnail image.) two_column dup 32 bitread dup /thint_page_cnt exch def (3. Number of pages that have thumbnail images.) two_column dup 16 bitread dup /thint_no_thumbnail_bits exch def (4. Bits for the max number of consecutive pages without a thumbnail image.) two_column dup 32 bitread dup /thint_min_sz exch def (5. The least length of a thumbnail image in bytes.) two_column dup 15 bitread dup /thint_obj_sz_bits exch def (6. Bits for the difference between max and min length of a thumbnail image.) two_column dup 32 bitread dup /thint_min_obj_cnt exch def (7. The least number of objects in a thumbnail image.) two_column dup 16 bitread dup /thint_obj_cnt_bits exch def (8. Bits for the difference between max and min number of objects in a thumbnail image.) two_column dup 32 bitread dup /thint_1st_shared_obj exch def (9. First object in the thumbnail shared objects section.) two_column dup 32 bitread dup /thint_1st_shared_pos exch def (10. Location of the first object in the thumbnail shared objects section.) two_column dup 32 bitread dup /thint_shared_cnt exch def (11. Number of thumbnail shared objects.) two_column dup 32 bitread dup /thint_shared_section_sz exch def (12. Length of the thumbnail shared objects section in bytes.) two_column pop LinearizationParams /N get (1. The number of preceding pages lacking a thumbnail image.) array_header hint_stream bytealign /thint_no_thumbnail_pages [ 2 index { hint_stream thint_no_thumbnail_bits bitread } repeat ] readonly def thint_no_thumbnail_pages dump_array (2. Number of objects in this page's thumbnail image.) array_header hint_stream bytealign /thint_page_obj_cnt [ 2 index { hint_stream thint_obj_cnt_bits bitread thint_min_obj_cnt add } repeat ] readonly def thint_page_obj_cnt dump_array (3. Length of this page's thumbnail image in bytes.) array_header hint_stream bytealign /thint_page_obj_sz [ 2 index { hint_stream thint_obj_sz_bits bitread thint_min_sz add } repeat ] readonly def thint_page_obj_sz dump_array pop } bind def % Analyze the generic hint table. % The hint field names are re-used. /dump_generic_table { hint_stream dup 32 bitread dup /ghint_1st_obj exch def (1. Object number of the first object in the group.) two_column dup 32 bitread dup /ghint_1st_obj_pos exch def (2. Location of the first object in the group.) two_column dup 32 bitread dup /ghint_obj_cnt exch def (3. Number of objects in the group.) two_column dup 32 bitread dup /ghint_group_sz exch def (4. Length of the object group in bytes.) two_column pop } bind def % Analyze the interactive hint table. % The hint field names are re-used. /dump_interactive_table { hint_stream dup 32 bitread dup /ihint_1st_obj exch def (1. Object number of the first object in the group.) two_column dup 32 bitread dup /ihint_1st_obj_pos exch def (2. Location of the first object in the group.) two_column dup 32 bitread dup /ihint_obj_cnt exch def (3. Number of objects in the group.) two_column dup 32 bitread dup /ihint_group_sz exch def (4. Length of the object group in bytes.) two_column dup 32 bitread dup /ihint_shared_cnt exch def (5. Number of shared object references.) two_column dup 16 bitread dup /ihint_shared_obj_bits exch def (6. Bits for the max shared object id used by the interactive form or the logical structure hierarchy.) 1 index hint_sobits ne { (\n*** This fiels is not equal to max shared object ID bits ***) concatstrings } if pop (7. Shared object identifier.) array_header hint_stream bytealign /ihint_shared_obj_id [ ihint_shared_cnt { hint_stream hint_sobits bitread } repeat ] readonly def ihint_shared_obj_id dump_array } bind def % Enumerate all documented hint tables. /dump_all_tables { % <<stream>> dump_all_tables - (Page offset hint table) table_header hint_stream 0 set_align dump_page_offset_table (S, Shared object hint table) table_header dup /S .knownget { hint_stream exch set_align dump_shared_object_table } { (Required table is not found.) error_msg } ifelse dup /T .knownget { (T, Thumbnail hint table) table_header hint_stream exch set_align dump_thumbnail_table } if dup /O .knownget { (O, Outline hint table) table_header hint_stream exch set_align dump_generic_table } if dup /A .knownget { (A, Thread information hint table) table_header hint_stream exch set_align dump_generic_table } if dup /E .knownget { (E, Named destination hint table) table_header hint_stream exch set_align dump_generic_table } if dup /V .knownget { (V, Interactive form hint table) table_header hint_stream exch set_align dump_interactive_table } if dup /I .knownget { (I, Information dictionary hint table) table_header hint_stream exch set_align dump_generic_table } if dup /C .knownget { (C, Logical structure hint table) table_header hint_stream exch set_align dump_interactive_table } if dup /L .knownget { (L, Page label hint table) table_header hint_stream exch set_align dump_generic_table } if pop } bind def % Load PDF file and extract the hint stream. /pdf_dump_hints { % <infile> pdf_dump_hints - dup (r) file % fname false exch % fname F file { dup 7 string readstring pop % fname F file () (%PDF-1.) ne { pop exit } if % fname F file dup 0 setfileposition dup token not { pop exit } if % fname F file obj dup type /integertype ne { pop exit } if % fname F file obj 1 index token not { pop pop exit } if % fname F file obj gen dup type /integertype ne {pop pop exit}if % fname F file obj gen 4 2 roll % fname obj gen F file dup 0 setfileposition exch true or % fname obj gen file T exit } loop { pdfdict begin pdfopenfile dup begin 40 dict begin /IDict exch def .setsafe % Read all objects into memory. Trailer touch resolveR % fname <<>> dup /Linearized known { dup /L get % fname <<>> Len 3 -1 roll status not { 0 0 0 0 } if % <<>> Len pop pop exch pop % <<>> Len len eq { /LinearizationParams exch def LinearizationParams /H get dup length 2 eq { 0 get PDFoffset add PDFfile exch setfileposition PDFfile token pop PDFfile token pop resolveR dup true resolvestream /ReusableStreamDecode filter bitstream dup bytealign /hint_stream exch def dump_all_tables } { pop (Overflow hint stream is not supported.) = } ifelse } { pop (Wrong file length in linearization dictionary.) = } ifelse } { pop (The file is not linearized.) = } ifelse end % temporary dict end % IDict end } { pop (Input file is not a valid PDF file.) = } ifelse } bind def % Initial setup /dump_hints { counttomark 1 eq { exch pop save exch 3000000 setvmthreshold pdfoptdict begin pdf_dump_hints end restore true } { cleartomark false } ifelse } bind def /shellarguments {false} def (pdfopt.ps) runlibfile currentdict /shellarguments undef % Check for command line arguments. mark shellarguments { dump_hints not { (Usage: gs -dNODISPLAY -- dumphint.ps input.pdf) = flush } if } { pop } ifelse % EOF