home
***
CD-ROM
|
disk
|
FTP
|
other
***
search
/
Fresh Fish 5
/
FreshFish_July-August1994.bin
/
bbs
/
gnu
/
gs-2.6.1.4-bin.lha
/
lib
/
ghostscript
/
ps2ascii.ps
< prev
next >
Wrap
Text File
|
1994-07-11
|
12KB
|
392 lines
% Copyright (C) 1991, 1992, 1993 Aladdin Enterprises. All rights reserved.
%
% This file is part of Ghostscript.
%
% Ghostscript is distributed in the hope that it will be useful, but
% WITHOUT ANY WARRANTY. No author or distributor accepts responsibility
% to anyone for the consequences of using it or for whether it serves any
% particular purpose or works at all, unless he says so in writing. Refer
% to the Ghostscript General Public License for full details.
%
% Everyone is granted permission to copy, modify and redistribute
% Ghostscript, but only under the conditions described in the Ghostscript
% General Public License. A copy of this license is supposed to have been
% given to you along with Ghostscript so you can know your rights and
% responsibilities. It should be in a file named COPYING. Among other
% things, the copyright notice and this notice must be preserved on all
% copies.
% Extract the ASCII text from a PostScript file. Nothing is displayed.
% Instead, ASCII information is written to stdout. If SIMPLE is defined,
% just the text is written, with a guess at line breaks and word spacing.
% If SIMPLE is not defined, lines are written to stdout as follows:
%
% F <height> <width> (<fontname>)
% indicate font height and width of a space
%
% S <x> <y> (<string>) <width>
% display a string
%
% P
% end of page
%
% <height> is an integer expressed in tenths of a point
% <width> is an integer in tenths of a point.
% <x> and <y> are integer coordinates, in tenths of a point, with origin
% at lower left.
% <string> and <fontname> are strings represented with the standard
% PostScript escape conventions.
% The idea is similar to Glenn Reid's `distillery', only a lot more
% simple-minded, and less robust.
% Note that this code will only work in all cases if systemdict is writable
% and if `binding' the definitions of operators defined as procedures
% is deferred. For this reason, it is normally invoked with
% gs -q -dNODISPLAY -dNOBIND -dWRITESYSTEMDICT ps2ascii.ps
% Thanks to J Greely <jgreely@cis.ohio-state.edu> for improvements
% to this code.
/QUIET true def
systemdict wcheck { systemdict } { userdict } ifelse begin
/SIMPLE dup where { pop true } { false } ifelse def
% Disable the display operators.
/eofill { newpath } odef
/erasepage { } odef
/fill { newpath } odef
/stroke { newpath } odef
% The image operators must read the input, but do nothing.
/colorimage { gsave nulldevice //colorimage grestore } odef
/image { gsave nulldevice //image grestore } odef
/imagemask { gsave nulldevice //imagemask grestore } odef
% Redefine the end-of-page operators.
/copypage { SIMPLE { (\014) } { (P\n) } ifelse //print } odef
/showpage { copypage erasepage initgraphics } odef
% Redefine `show'.
% Set things up so our output will be in tenths of a point, with origin at
% lower left. This isolates us from the peculiarities of individual devices.
/.show.ident.matrix matrix def
/.show.ident
% { //.show.ident.matrix defaultmatrix
% % Assume the original transformation is well-behaved.
% 0.1 0 2 index dtransform abs exch abs max /.show.scale exch def
% 0.1 dup 3 -1 roll scale
{ gsave initmatrix
% Assume the original transformation is well-behaved.
0.1 0 dtransform abs exch abs max /.show.scale exch def
0.1 dup scale .show.ident.matrix currentmatrix
grestore
} bind def
/.coord
{ transform .show.ident itransform
exch round cvi exch round cvi
} odef
/.dcoord
{ % Transforming distances is trickier, because
% the coordinate system might be rotated.
.show.ident pop
exch 0 dtransform
% dup 0 ne { dup mul exch dup mul add sqrt } { pop abs } ifelse
dup mul exch dup mul add sqrt
.show.scale div round cvi
exch 0 exch dtransform
% exch dup 0 ne { dup mul exch dup mul add sqrt } { pop abs } ifelse
dup mul exch dup mul add sqrt
.show.scale div round cvi
} odef
% Define a way to store and retrieve integers that survives save/restore.
/.i.string ( ) def
/.iget { cvi } bind def
/.iput { exch //.i.string exch copy cvs pop } bind def
/.inew { //.i.string length string dup 3 -1 roll .iput } bind def
/.show.x 0 .inew def
/.show.y 0 .inew def
/.show.height 1000 .inew def
% Remember the last character of the previous string; if it was a
% hyphen preceded by a letter, we didn't output the hyphen.
/.show.last (\000) def
% Make sure writing will work even if a program uses =string.
/.show.string =string length string def
/.show.=string =string length string def
/.show==only
{ //=string //.show.=string copy pop
dup type /stringtype eq
{ dup length //.show.string length le
{ dup rcheck { //.show.string copy } if
} if
} if
//.stdout exch write==only
//.show.=string //=string copy pop
} odef
/.showfont
%(following comments are from J Greely)
%old code - This didn't work right for me with all fonts.
%
% { 0 currentfont /FontBBox get dup 3 get exch 1 get sub
% currentfont /FontMatrix get dtransform dtransform
% exch abs exch abs max round
% (F ) //print //.stdout exch write==only (\n) //print
% } odef
%
%unfortunately, my way bombs on one of my test files in
%--%show_continue--(?!). It's from dvi2ps, which molests
%the fonts in some way. --jgreely
{ gsave
% If we can't get the height and width of the font from
% the FontBBox, we just measure some characters.
currentfont /FontBBox .knownget not { {0 0 0 0} } if
aload pop exch 4 -1 roll sub 3 1 roll exch sub
2 copy max 0 ne
{ currentfont /FontMatrix get dtransform
}
{ % Unfortunately, charpath is broken in some versions,
% so we use stringwidth and fudge.
(X) stringwidth pop dup 1.3 mul
}
ifelse .dcoord exch
currentfont /FontName .knownget not { () } if
dup type /nametype eq { //.show.string cvs } if
grestore
% Stack: height width fontname
SIMPLE
{ pop pop //.show.height exch .iput }
{ (F ) //print 3
{ 2 index .show==only ( ) //print 3 -1 roll } repeat
pop pop pop (\n) //print
}
ifelse
} odef
% Define the letters -- characters which, if they occur followed by a hyphen
% at the end of a line, cause the hyphen and line break to be ignored.
/.letter.chars 100 dict def
mark
65 1 90 { dup 32 add } for
counttomark { StandardEncoding exch get .letter.chars exch dup put } repeat
pop
% Define a set of characters which, if they occur at the start of a line,
% are taken as indicating a paragraph break.
/.break.chars 50 dict def
mark
/bullet /dagger /daggerdbl /periodcentered /section
counttomark { .break.chars exch dup put } repeat
pop
% Define character translation to ASCII.
% We have to do this for the entire character set.
/.char.map 500 dict def
/.chars.def { counttomark 2 idiv { .char.map 3 1 roll put } repeat pop } def
% Encode the printable ASCII characters.
mark 32 1 126
{ 1 string dup 0 4 -1 roll put
dup 0 get StandardEncoding exch get exch
}
for .chars.def
% Encode accents.
mark
/acute (') /caron (^) /cedilla (,) /circumflex (^)
/dieresis (") /grave (`) /ring (*) /tilde (~)
.chars.def
% Encode the ISO accented characters.
mark 192 1 255
{ ISOLatin1Encoding exch get =string cvs
dup 0 1 getinterval 1 index dup length 1 sub 1 exch getinterval
.char.map 2 index known .char.map 2 index known and
{ .char.map 3 -1 roll get .char.map 3 -1 roll get concatstrings
.char.map 3 1 roll put
}
{ pop pop pop
}
ifelse
}
for .chars.def
% Encode the remaining standard and ISO alphabetic characters.
mark
/AE (AE) /Eth (DH) /OE (OE) /Thorn (Th)
/ae (ae) /eth (dh)
/ffi (ffi) /ffl (ffl) /fi (fi) /fl (fl)
/germandbls (ss) /oe (oe) /thorn (th)
.chars.def
% Encode the other standard and ISO characters.
mark
/brokenbar (|) /bullet (*) /copyright ((C)) /currency (#)
/dagger (#) /daggerdbl (##) /degree (o) /divide (/) /dotaccent (.)
/dotlessi (i)
/ellipsis (...) /emdash (--) /endash (-) /exclamdown (!)
/florin (f) /fraction (/)
/guillemotleft (<<) /guillemotright (>>)
/guilsingleft (<) /guilsingright (>) /hungarumlaut ("") /logicalnot (~)
/macron (_) /minus (-) /mu (u) /multiply (*)
/ogonek (,) /onehalf (1/2) /onequarter (1/4) /onesuperior (1)
/