Plan 9 from Bell Labs’s /usr/web/sources/plan9/sys/src/cmd/gs/lib/dumphint.ps

Copyright © 2021 Plan 9 Foundation.
Distributed under the MIT License.
Download the Plan 9 distribution.


% Copyright (C) 2000, 2001 Aladdin Enterprises.  All rights reserved.
% 
% This software is provided AS-IS with no warranty, either express or
% implied.
% 
% This software is distributed under license and may not be copied,
% modified or distributed except as expressly authorized under the terms
% of the license contained in the file LICENSE in this distribution.
% 
% For more information about licensing, please refer to
% http://www.ghostscript.com/licensing/. For information on
% commercial licensing, go to http://www.artifex.com/licensing/ or
% contact Artifex Software, Inc., 101 Lucas Valley Road #110,
% San Rafael, CA  94903, U.S.A., +1(415)492-9861.

% $Id: dumphint.ps,v 1.2 2004/04/08 16:18:25 giles Exp $
% Linearized PDF hint formatting utility.

%
% Linearized PDF hints generated by Acrobat suite seem to deviate from
% the published specification.
%
% /P (page offset hint table) key in hint stream is not generated by
% Adobe products. The key is no longer required in PDF 1.5.
%
% Per-page items 4 and 5 of the page offset hint table start from 1st
% page rather than 2nd page as the spec claims.
%
% All array entries start from the new byte boundary.
%

/table_width 79 def 
/col1_width  66 def

% Skip bits to the next byte boundary
/bytealign {		% <stream> bytealign -
  begin /N 0 def /B 0 def end
} bind def

% Set bit stream position and align it to byte boundary
/set_align {            % <<>> pos set_align -
  exch begin
  S exch setfileposition
  /N 0 def /B 0 def
  end
} bind def

% Read requested number of bits from the bit stream.
/bitread {		% <bstream> <width> bitwrite <value>
  exch begin
  0                     %  bit val
  { 
    1 index N .min      %  bit val m
    dup 3 1 roll        %  bit m val m 
    bitshift            %  bit m val<<m
    B 2 index N sub     %  bit m val<<m B m-N
    bitshift add        %  bit m val<<m+B>>(N-m)
    3 -1 roll           %  m val' bit 
    2 index sub         %  m val' bit'
    3 -1 roll           %  val' bit' m
    N exch sub dup      %  val' bit' N' N'
    1 exch bitshift     %  val' bit' N' 1<<N'
    1 sub B and         %  val' bit' N' B&(1<<N')
    /B exch def         %  val' bit' N'
    /N exch def         %  val' bit'
    dup 0 le {
      pop exit          %  val'
    } if
    /N N 8 add def
    /B B 8 bitshift S read not { 0 ( *** EOF! *** ) = } if add def
    exch
  } loop                %  bit' val'
  end
} bind def

% Print a string several times
/multiprint {           % cnt (s) multiprint -
  exch { dup print } repeat pop
} bind def

% Split the line into 2 substrings.
/split_line {           % (s) split_line () ()
  dup length col1_width gt {
    col1_width 1 sub
    dup -1 0 {
      dup               % (s) w i i
      3 index           % (s) w i i ()
      exch get          % (s) w i c
      32 eq {
        exch pop exit
      } if
      pop
    } for
    1 add               % (s) w'
    1 index exch        % (s) (s) w'
    0 exch              % (s) (s) 0 w'
    getinterval         % (s) (v)
  } {
    dup                 % (s) (s)
  } ifelse                  
  (\n) search {
    4 1 roll            % (pre) (s) (post) (match)
    pop pop             % (pre) (s)
    1 index length      % (pre) (s) len
    1 add               % (pre) (s) len+1
  } {
    exch                % (pre) (s)
    1 index length      % (pre) (s) len
  } ifelse
  1 index length        % (pre) (s) len Len
  1 index sub           % (pre) (s) len Len-len
  getinterval           % (pre) (post)
} bind def

% Print a 2 column table. The string is printed in 1st column
% left-aligned. The number is printed in 2nd column right-aligned.
/two_column {           % n () two_column -
  split_line            % n (a) ()
  3 1 roll              % () n (a)
  dup length            % () n (a) len
  exch print            % () n len
  exch =string cvs      % () len (n)
  dup length            % () len (n) len2
  3 -1 roll add         % () (n) len+len2 
  //table_width         % () (n) len+len2 78
  exch sub              % () (n) 78-len+len2 
  ( ) multiprint        % () (n)
  =                     % ()
  { dup length 0 eq { exit } if
    split_line exch =
  } loop
  pop
  () =
} bind def

% Print the header of a hint table
/table_header {               % () table_header -
  dup length dup
  table_width exch sub 2 idiv % () len sp
  dup ( ) multiprint          % () len sp
  3 -1 roll =                 % len sp
  ( ) multiprint              % len
  (=) multiprint
  ()= ()=
} bind def

% Pretty-print an array on top level
/dump_array {               % [ ] dump_array -
  ([) = ( ) print
  1 exch {
    =string cvs         % pos ()
    dup length dup      % pos () len len
    3 index add 1 add   % pos () len len+pos+1
    table_width gt {
      () =
      (  ) print        % pos () len
      2 add             % pos () pos'
      3 1 roll print pop % pos'
    } {
      ( ) print         % pos () len
      exch print        % pos len
      add 1 add         % pos'
    } ifelse
  } forall
  pop
  () = (]) =
} bind def

% Pretty-print an array on 2nd level
/dump_array2 {             % [ ] dump_array2 -
  (  [) print
  3 exch {
    =string cvs            % pos ()
    dup length dup         % pos () len len
    3 index add 1 add      % pos () len len+pos+1
    table_width 2 sub gt {
      () =
      (    ) print         % pos () len
      4 add                % pos () pos'
      3 1 roll print pop   % pos'
    } {
      ( ) print            % pos () len
      exch print           % pos len
      add 1 add            % pos'
    } ifelse
  } forall
  pop
  ( ]) =
} bind def

% Print an array header
/array_header {
  () = =
} bind def

% Analyze the page offset hint table.
/dump_page_offset_table {  % - dump_page_offset_table -
  hint_stream
    
  dup 32 bitread
  dup /hint_minnop exch def
  (1. The least number of objects in a page.) two_column

  dup 32 bitread
  dup /hint_1st_obj exch def
  (2. Location of the first page's page object.) two_column

  dup 16 bitread
  dup /hint_maxnopbits exch def
  (3. Bits for difference between max and min number of page objects.) two_column

  dup 32 bitread
  dup /hint_minpl exch def
  (4. Least length of a page.) two_column

  dup 16 bitread
  dup /hint_maxplbits exch def
  (5. Bits for difference between max and min length of a page.) two_column

  dup 32 bitread
  dup /hint_minsco exch def
  (6. Least start of Contents offset. ) 
  1 index 0 ne { (\n*** Acrobat expects 0 ***) concatstrings } if
  two_column

  dup 16 bitread
  dup /hint_maxscobits exch def
  (7. Bits for difference between max and min offset to the start of the content stream.) two_column

  dup 32 bitread
  dup /hint_mincl exch def
  (8. Least contents length.) two_column

  dup 16 bitread
  dup /hint_maxclbits exch def
  (9. Bits needed to represent the greatest Contents length.) two_column

  dup 16 bitread
  dup /hint_maxsorbits exch def
  (10. Bits needed to represent the greatest number of Shared Object references.) two_column

  dup 16 bitread
  dup /hint_sobits exch def
  (11. Bits needed to identify a Shared Object.) two_column

  dup 16 bitread
  dup /hint_numfbits exch def
  (12. Bits needed to represent numerator of fraction.) two_column

  dup 16 bitread
  dup /hint_denf exch def
  (13. Denominator of fraction.) two_column

  pop 

  LinearizationParams /N get

  % 1. Number of objects in the page.
  hint_stream bytealign
  /hint_page_obj [
    2 index {
      hint_stream hint_maxnopbits bitread
      hint_minnop add
    } repeat
  ] readonly def

  (1. Number of objects on the page) array_header
  hint_page_obj dump_array

  % 2, Page length in bytes.
  hint_stream bytealign
  /hint_page_len [
    2 index {
      hint_stream hint_maxplbits bitread
      hint_minpl add
    } repeat
  ] readonly def

  (2. Page length in bytes.) array_header
  hint_page_len dump_array

  % 3, Number of shared objects referenced from the page
  hint_stream bytealign
  /hint_page_sobj [
    2 index {
      hint_stream hint_maxsorbits bitread
    } repeat
  ] readonly def

  (3. Number of shared objects referenced from the page.) array_header
  hint_page_sobj dump_array

  % 4. Index into the shared objects hint table
  hint_stream bytealign
  /hint_page_sobj_id [
    0 1 4 index 1 sub {
      hint_page_sobj exch get [
        exch {
          hint_stream hint_sobits bitread
        } repeat
      ] readonly
    } for
  ] readonly def

  (4. Index into the shared objects hint table.) array_header
  ([) =
  hint_page_sobj_id { dump_array2 } forall
  (])=

  % 5. Fractional position for each shared object reference
  hint_stream bytealign
  /hint_page_sobj_pos [
    0 1 4 index 1 sub {
      hint_page_sobj exch get [
        exch {
          hint_stream hint_numfbits bitread
          hint_denf div
        } repeat
      ] readonly
    } for
  ] readonly def

  (5. Fractional position for each shared object reference. ) array_header
  ([)=
  hint_page_sobj_pos { dump_array2 } forall
  (])=

  % 6. Offset of the page's content stream from the beginning of the page.
  hint_stream bytealign
  /hint_page_content_offset [
    2 index {
      hint_stream hint_maxscobits bitread
      hint_minsco add
    } repeat
  ] readonly def

  (6. Offset of the page's content stream from the beginning of the page.) array_header
  hint_page_content_offset dump_array

  % 7. Length of the page's content stream in bytes.
  hint_stream bytealign
  /hint_page_content_len [
    2 index {
      hint_stream hint_maxclbits bitread
      hint_mincl add
    } repeat
  ] readonly def

  (7. Length of the page's content stream in bytes.) array_header
  hint_page_content_len dump_array

  pop
} bind def

% Analyze tha shared object hint table
/dump_shared_object_table { 
  hint_stream
    
  dup 32 bitread
  dup /shint_1st_obj_id exch def
  (1. Object number of the first object in the shared objects section) two_column

  dup 32 bitread
  dup /shint_1st_obj_pos exch def
  (2. Location of the first object in the shared objects section.) two_column

  dup 32 bitread
  dup /shint_1st_shared exch def
  (3. The number of shared object entries for the first page.) two_column

  dup 32 bitread
  dup /shint_all_shared exch def
  (4. Number of shared object entries for the shared objects section including 1st page.) two_column

  dup 16 bitread
  dup /shint_group_bits exch def
  (5. Number of bits needed to represent the greatest number of objects in a shared object group.) two_column

  dup 32 bitread
  dup /shint_group_least_sz exch def
  (6. Least length of a shared object group in bytes.) two_column

  dup 16 bitread
  dup /shint_group_diff_bits exch def
  (7. Bits for the difference between the greatest and least length of a shared object group size.)  two_column
  pop

  (1. length of the object group in bytes.) array_header
  hint_stream bytealign
  /shint_group_sz [
    shint_all_shared {
      hint_stream shint_group_diff_bits bitread
      shint_group_least_sz add
    } repeat
  ] readonly def

  shint_group_sz dump_array

  (2. MD5 signature flag) array_header
    hint_stream bytealign
    /shint_md5_flags
    [ shint_all_shared 
      { hint_stream 1 bitread
      } repeat
    ] readonly def

    shint_md5_flags dump_array

    (3. MD5 signature string) array_header
    false shint_md5_flags { 0 ne or } forall { 
      shint_md5_flags {
        0 eq {
          (<>)=
        } {
          hint_stream /S get 128 string
          readstring pop
          dup length 128 eq {
            ==
          } { pop (Error reading nd5 string.) ==
          } ifelse
        } ifelse
      } forall   
    } {
      () = (none) =
    } ifelse

    (4. The number of objects in the group.) array_header
    hint_stream bytealign
    /shint_group_cnt [
      shint_all_shared {
        hint_stream shint_group_bits bitread
      } repeat
    ] readonly def

    shint_group_cnt dump_array

  } bind def

% Analyze the thumbnail hint table.
/dump_thumbnail_table {
  hint_stream

  dup 32 bitread
  dup /thint_1st_obj_id exch def
  (1. Object number of the first thumbnail image.) two_column

  dup 32 bitread
  dup /thint_1st_obj_pos exch def
  (2. Location of the first thumbnail image.) two_column

  dup 32 bitread
  dup /thint_page_cnt exch def
  (3. Number of pages that have thumbnail images.) two_column

  dup 16 bitread
  dup /thint_no_thumbnail_bits exch def
  (4. Bits for the max number of consecutive pages without a thumbnail image.) two_column

  dup 32 bitread
  dup /thint_min_sz exch def
  (5. The least length of a thumbnail image in bytes.) two_column

  dup 15 bitread
  dup /thint_obj_sz_bits exch def
  (6. Bits for the difference between max and min length of a thumbnail image.) two_column

  dup 32 bitread
  dup /thint_min_obj_cnt exch def
  (7. The least number of objects in a thumbnail image.) two_column

  dup 16 bitread
  dup /thint_obj_cnt_bits exch def
  (8. Bits for the difference between max and min number of objects in a thumbnail image.) two_column

  dup 32 bitread
  dup /thint_1st_shared_obj exch def
  (9. First object in the thumbnail shared objects section.) two_column

  dup 32 bitread
  dup /thint_1st_shared_pos exch def
  (10. Location of the first object in the thumbnail shared objects section.) two_column

  dup 32 bitread
  dup /thint_shared_cnt exch def
  (11. Number of thumbnail shared objects.) two_column

  dup 32 bitread
  dup /thint_shared_section_sz exch def
  (12. Length of the thumbnail shared objects section in bytes.) two_column

  pop
  LinearizationParams /N get

  (1. The number of preceding pages lacking a thumbnail image.) array_header
  hint_stream bytealign
  /thint_no_thumbnail_pages [
    2 index {
      hint_stream thint_no_thumbnail_bits bitread
    } repeat
  ] readonly def

  thint_no_thumbnail_pages dump_array

  (2. Number of objects in this page's thumbnail image.) array_header
  hint_stream bytealign
  /thint_page_obj_cnt [
    2 index {
      hint_stream thint_obj_cnt_bits bitread
      thint_min_obj_cnt add
    } repeat
  ] readonly def

  thint_page_obj_cnt dump_array

  (3. Length of this page's thumbnail image in bytes.) array_header
  hint_stream bytealign
  /thint_page_obj_sz [
    2 index {
      hint_stream thint_obj_sz_bits bitread
      thint_min_sz add
    } repeat
  ] readonly def

  thint_page_obj_sz dump_array
  pop
} bind def

% Analyze the generic hint table.
% The hint field names are re-used. 
/dump_generic_table { 
  hint_stream

  dup 32 bitread
  dup /ghint_1st_obj exch def
  (1. Object number of the first object in the group.) two_column

  dup 32 bitread
  dup /ghint_1st_obj_pos exch def
  (2. Location of the first object in the group.) two_column

  dup 32 bitread
  dup /ghint_obj_cnt exch def
  (3. Number of objects in the group.) two_column

  dup 32 bitread
  dup /ghint_group_sz exch def
  (4. Length of the object group in bytes.) two_column

  pop
} bind def

% Analyze the interactive hint table.
% The hint field names are re-used.
/dump_interactive_table {
  hint_stream

  dup 32 bitread
  dup /ihint_1st_obj exch def
  (1. Object number of the first object in the group.) two_column

  dup 32 bitread
  dup /ihint_1st_obj_pos exch def
  (2. Location of the first object in the group.) two_column

  dup 32 bitread
  dup /ihint_obj_cnt exch def
  (3. Number of objects in the group.) two_column

  dup 32 bitread
  dup /ihint_group_sz exch def
  (4. Length of the object group in bytes.) two_column

  dup 32 bitread
  dup /ihint_shared_cnt exch def
  (5. Number of shared object references.) two_column

  dup 16 bitread
  dup /ihint_shared_obj_bits exch def
  (6. Bits for the max shared object id used by the interactive form or the logical structure hierarchy.)
  1 index hint_sobits ne {
    (\n*** This fiels is not equal to max shared object ID bits ***) concatstrings 
  } if

  pop

  (7. Shared object identifier.) array_header
  hint_stream bytealign
  /ihint_shared_obj_id [
    ihint_shared_cnt {
      hint_stream hint_sobits bitread
    } repeat
  ] readonly def

  ihint_shared_obj_id dump_array
} bind def

% Enumerate all documented hint tables.
/dump_all_tables {  % <<stream>> dump_all_tables -
  (Page offset hint table) table_header
  hint_stream 0 set_align
  dump_page_offset_table

  (S, Shared object hint table) table_header
  dup /S .knownget {
    hint_stream exch set_align
    dump_shared_object_table
  } {
    (Required table is not found.) error_msg
  } ifelse

  dup /T .knownget {
    (T, Thumbnail hint table) table_header
    hint_stream exch set_align
    dump_thumbnail_table
  } if   

  dup /O .knownget {
    (O, Outline hint table) table_header
    hint_stream exch set_align
    dump_generic_table
  } if

  dup /A .knownget {
    (A, Thread information hint table) table_header 
    hint_stream exch set_align
    dump_generic_table
  } if

  dup /E .knownget {
    (E, Named destination hint table) table_header
    hint_stream exch set_align
    dump_generic_table
  } if

  dup /V .knownget {
    (V, Interactive form hint table) table_header
    hint_stream exch set_align
    dump_interactive_table
  } if

  dup /I .knownget {
    (I, Information dictionary hint table) table_header
    hint_stream exch set_align
    dump_generic_table
  } if

  dup /C .knownget {
    (C, Logical structure hint table) table_header
    hint_stream exch set_align
    dump_interactive_table
  } if

  dup /L .knownget {
    (L, Page label hint table) table_header
    hint_stream exch set_align
    dump_generic_table
  } if

    pop
} bind def


% Load PDF file and extract the hint stream.
/pdf_dump_hints {                             % <infile> pdf_dump_hints -
  dup (r) file                                % fname
  false exch                                  % fname F file 
  {
    dup 7 string readstring pop               % fname F file ()
    (%PDF-1.) ne { pop exit } if              % fname F file
    dup 0 setfileposition
    dup token not { pop exit } if             % fname F file obj
    dup type /integertype ne { pop exit } if  % fname F file obj
    1 index token not { pop pop exit } if     % fname F file obj gen
    dup type /integertype ne {pop pop exit}if % fname F file obj gen
    4 2 roll                                  % fname obj gen F file
    dup 0 setfileposition
    exch true or                              % fname obj gen file T
    exit
  } loop
  {
    pdfdict begin
    pdfopenfile dup begin
    40 dict begin
    /IDict exch def
    .setsafe

    % Read all objects into memory.
    Trailer touch
    resolveR                                  % fname <<>>
    dup /Linearized known {
      dup /L get                              % fname <<>> Len
      3 -1 roll status not { 0 0 0 0 } if     % <<>> Len
      pop pop exch pop                        % <<>> Len len
      eq {
        /LinearizationParams exch def
        LinearizationParams /H get
        dup length 2 eq {
          0 get PDFoffset add PDFfile exch setfileposition
          PDFfile token pop 
          PDFfile token pop
          resolveR dup true resolvestream
          /ReusableStreamDecode filter 
          bitstream dup bytealign
          /hint_stream exch def

          dump_all_tables
        } {
          pop
          (Overflow hint stream is not supported.) =
        } ifelse
      } {
        pop
        (Wrong file length in linearization dictionary.) =
      } ifelse
    } {
      pop (The file is not linearized.) =
    } ifelse
    end		% temporary dict
    end		% IDict
    end
  } {
    pop
    (Input file is not a valid PDF file.) =
  } ifelse
} bind def

% Initial setup
/dump_hints {
  counttomark 1 eq {
    exch pop
    save exch
    3000000 setvmthreshold
    pdfoptdict begin 
    pdf_dump_hints
    end
    restore
    true
  } {
    cleartomark false
  } ifelse
} bind def

/shellarguments {false} def
(pdfopt.ps) runlibfile
currentdict /shellarguments undef

% Check for command line arguments.
mark shellarguments {
  dump_hints not {
    (Usage: gs -dNODISPLAY  -- dumphint.ps input.pdf) = flush
  } if
} {
  pop
} ifelse

% EOF

Bell Labs OSI certified Powered by Plan 9

(Return to Plan 9 Home Page)

Copyright © 2021 Plan 9 Foundation. All Rights Reserved.
Comments to webmaster@9p.io.