#!/usr/bin/env python # Portions Copyright (C) 2001-2021 Artifex Software Inc. # # This software is distributed under license and may not be copied, modified # or distributed except as expressly authorized under the terms of that # license. Refer to licensing information at http://www.artifex.com/ or # contact Artifex Software, Inc., 1305 Grant Avenue - Suite 200, # Novato, CA 94945, (415)492-9861, for further information. # # TODO # array data should be wrapped. # # text data should be printed as a string not an array of ascii values. # # enumerations should printed we now print the ordinal value of the enumeration. # # make self.unpack endian like with binding # DIFFS between HP # Artifex reports the file offset of each operator HP does not. #Python 3 compat mode for Python2 must be the first line (without conditionals): # 'from __future__ imports must occur at the beginning of the file' from __future__ import print_function, unicode_literals import sys if sys.version < '3': def chr_(x): return x def ord_(x): return ord(x) def unpackB(x): return unpack(b'B', x)[0] def b(x): return x.encode() else: def chr_(x): return chr(x) def ord_(x): return x def unpackB(x): return x def b(x): return x # for packing and unpacking binary data from struct import * # tags pxl_tags_dict = { 'ArcPath' : 0x91, 'BeginChar' : 0x52, 'BeginFontHeader' : 0x4f, 'BeginImage' : 0xb0, 'BeginPage' : 0x43, 'BeginRastPattern' : 0xb3, 'BeginScan' : 0xb6, 'BeginSession' : 0x41, 'BeginStream' : 0x5b, 'BeginUserDefinedLineCap' : 0x82, 'BezierPath' : 0x93, 'BezierRelPath' : 0x95, 'Chord' : 0x96, 'ChordPath' : 0x97, 'CloseDataSource' : 0x49, 'CloseSubPath' : 0x84, 'Comment' : 0x47, 'Ellipse' : 0x98, 'EllipsePath' : 0x99, 'EndChar' : 0x54, 'EndFontHeader' : 0x51, 'EndImage' : 0xb2, 'EndPage' : 0x44, 'EndRastPattern' : 0xb5, 'EndScan' : 0xb8, 'EndSession' : 0x42, 'EndStream' : 0x5d, 'EndUserDefinedLineCaps' : 0x83, 'ExecStream' : 0x5e, 'LinePath' : 0x9b, 'LineRelPath' : 0x9d, 'NewPath' : 0x85, 'OpenDataSource' : 0x48, 'PaintPath' : 0x86, 'Passthrough' : 0xbf, 'Pie' : 0x9e, 'PiePath' : 0x9f, 'PopGS' : 0x60, 'PushGS' : 0x61, 'ReadChar' : 0x53, 'ReadFontHeader' : 0x50, 'ReadImage' : 0xb1, 'ReadRastPattern' : 0xb4, 'ReadStream' : 0x5c, 'Rectangle' : 0xa0, 'RectanglePath' : 0xa1, 'RemoveFont' : 0x55, 'RemoveStream' : 0x5f, 'RoundRectangle' : 0xa2, 'RoundRectanglePath' : 0xa3, 'ScanLineRel' : 0xb9, 'SetAdaptiveHalftoning' : 0x94, 'SetBrushSource' : 0x63, 'SetCharAttributes' : 0x56, 'SetCharAngle' : 0x64, 'SetCharBoldValue' : 0x7d, 'SetCharScale' : 0x65, 'SetCharShear' : 0x66, 'SetCharSubMode' : 0x81, 'SetClipIntersect' : 0x67, 'SetClipMode' : 0x7f, 'SetClipRectangle' : 0x68, 'SetClipReplace' : 0x62, 'SetClipToPage' : 0x69, 'SetColorSpace' : 0x6a, 'SetColorTrapping' : 0x92, 'SetColorTreatment' : 0x58, 'SetCursor' : 0x6b, 'SetCursorRel' : 0x6c, 'SetDefaultGS' : 0x57, 'SetHalftoneMethod' : 0x6d, 'SetFillMode' : 0x6e, 'SetFont' : 0x6f, 'SetLineCap' : 0x71, 'SetLineDash' : 0x70, 'SetLineJoin' : 0x72, 'SetMiterLimit' : 0x73, 'SetNeutralAxis' : 0x7e, 'SetPageDefaultCTM' : 0x74, 'SetPageOrigin' : 0x75, 'SetPageRotation' : 0x76, 'SetPageScale' : 0x77, 'SetPathToClip' : 0x80, 'SetPatternTxMode' : 0x78, 'SetPenSource' : 0x79, 'SetPenWidth' : 0x7a, 'SetROP' : 0x7b, 'SetSourceTxMode' : 0x7c, 'Text' : 0xa8, 'TextPath' : 0xa9, 'VendorUnique' : 0x46, 'attr_ubyte' : 0xf8, 'attr_uint16' : 0xf9, 'embedded_data' : 0xfa, 'embedded_data_byte' : 0xfb, 'real32' : 0xc5, 'real32_array' : 0xcd, 'real32_box' : 0xe5, 'real32_xy' : 0xd5, 'sint16' : 0xc3, 'sint16_array' : 0xcb, 'sint16_box' : 0xe3, 'sint16_xy' : 0xd3, 'sint32' : 0xc4, 'sint32_array' : 0xcc, 'sint32_box' : 0xe4, 'sint32_xy' : 0xd4, 'ubyte' : 0xc0, 'ubyte_array' : 0xc8, 'ubyte_box' : 0xe0, 'ubyte_xy' : 0xd0, 'uint16' : 0xc1, 'uint16_array' : 0xc9, 'uint16_box' : 0xe1, 'uint16_xy' : 0xd1, 'uint32' : 0xc2, 'uint32_array' : 0xca, 'uint32_box' : 0xe2, 'uint32_xy' : 0xd2 } pxl_enumerations_dict = { 'ArcDirection' : [ 'eClockWise=0', 'eCounterClockWise=1' ], 'BackCh' : ['eErrorPage=0'], # deprecated. 'CharSubModeArray' : [ 'eNoSubstitution=0', 'eVerticalSubstitution=1' ], 'ClipMode' : ['eNonZeroWinding=0', 'eEvenOdd=1' ], 'ClipRegion' : ['eInterior=0', 'eExterior=1'], 'ColorDepth' : [ 'e1Bit=0', 'e4Bit=1', 'e8Bit=2' ], 'ColorMapping' : [ 'eDirectPixel=0', 'eIndexedPixel=1' ], 'ColorSpace' : [ 'eGray=1', 'eRGB=2', 'eSRGB=6', 'eGraySub=7'], # srgb deprecated 'ColorTreatment' : [ 'eNoTreatment=0', 'eScreenMatch=1', 'eVivid=2' ], 'CompressMode' : [ 'eNoCompression=0', 'eRLECompression=1', 'eJPEGCompression=2', 'eDeltaRowCompression=3' ], 'DataOrg' : [ 'eBinaryHighByteFirst=0', 'eBinaryLowByteFirst=1' ], 'DataSource' : [ 'eDefault=0' ], 'DataType' : [ 'eUByte=0', 'eSByte=1', 'eUint16=2', 'eSint16=3' ], 'DitherMatrix' : [ 'eDeviceBest=0' ], 'DuplexPageMode' : [ 'eDuplexHorizontalBinding=0', 'eDuplexVerticalBinding=1' ], 'DuplexPageSide' : [ 'eFrontMediaSide=0', 'eBackMediaSide=1' ], 'ErrorReport' : ['eNoReporting=0', 'eBackChannel=1', 'eErrorPage=2', 'eBackChAndErrPage=3', 'eNWBackChannel=4', 'eNWErrorPage=5', 'eNWBackChAndErrPage=6' ], 'FillMode' : ['eNonZeroWinding=0', 'eEvenOdd=1' ], 'LineJoineMiterJoin' : [ 'eRoundJoin=0', 'eBevelJoin=1', 'eNoJoin=2' ], 'MediaSource' : [ 'eDefaultSource=0', 'eAutoSelect=1', 'eManualFeed=2', 'eMultiPurposeTray=3', 'eUpperCassette=4', 'eLowerCassette=5', 'eEnvelopeTray=6', 'eThirdCassette=7', 'External Trays=8-255' ], 'MediaDestination' : [ 'eDefaultDestination=0', 'eFaceDownBin=1', 'eFaceUpBin=2', 'eJobOffsetBin=3', 'External Bins=5-255' ], 'LineCapStyle' : [ 'eButtCap=0', 'eRoundCap=1', 'eSquareCap=2', 'eTriangleCap=3' ], 'LineJoin' : [ 'eMiterJoin=0', 'eRoundJoin=1', 'eBevelJoin=2', 'eNoJoin=3' ], 'Measure' : [ 'eInch=0', 'eMillimeter=1', 'eTenthsOfAMillimeter=2' ], 'MediaSize' : [ 'eDefault=96', 'eLetterPaper=0', 'eLegalPaper=1', 'eA4Paper=2', 'eExecPaper=3', 'eLedgerPaper=4', 'eA3Paper=5', 'eCOM10Envelope=6', 'eMonarchEnvelope=7', 'eC5Envelope=8', 'eDLEnvelope=9', 'eJB4Paper=10', 'eJB5Paper=11', 'eB5Paper=13', 'eB5Envelope=12', 'eJPostcard=14', 'eJDoublePostcard=15', 'eA5Paper=16', 'eA6Paper=17', 'eJBPaper=18', 'JIS8K=19', 'JIS16K=20', 'JISExec=21' ], 'Orientation' : ['ePortraitOrientation=0', 'eLandscapeOrientation=1', 'eReversePortrait=2', 'eReverseLandscape=3', 'eDefaultOrientation=4' ], 'PatternPersistence' : [ 'eTempPattern=0', 'ePagePattern=1', 'eSessionPattern=2'], 'SimplexPageMode' : ['eSimplexFrontSide=0'], 'TxMode' : [ 'eOpaque=0', 'eTransparent=1' ], 'VUExtension' : [ 'HP_ColorSmartRGB=68186216', #0x04107068 'HP_ColorSmartRGB=1752174596', #0x68701004 'HP_SelectTrayBinByString=1752178693', #0x68702005 'EnterFRMode=1752178694', #0x68702006 'FRExtension=1752178705', #0x68702011 'JR3BeginImage=1752186880', #0x68704000 'JR3ReadImage=1752186881' , #0x68704001 'JR3EndImage=1752186882' , #0x68704002 'JR3ExecStream=1752186883', #0x68704003 ], 'WritingMode' : [ 'eHorizontal=0', 'eVertical=1' ] } # see appendix F pxl_attribute_name_to_attribute_number_dict = { 'AllObjectTypes' : 29, 'ArcDirection' : 65, 'BlockByteLength' : 111, 'BlockHeight' : 99, 'BoundingBox' : 66, 'ColorimetricColorSpace': 17, # deprecated 'CharAngle' : 161, 'CharBoldValue' : 177, 'CharCode' : 162, 'CharDataSize' : 163, 'CharScale' : 164, 'CharShear' : 165, 'CharSize' : 166, 'CharSubModeArray' : 172, 'ClipMode' : 84, 'ClipRegion' : 83, 'ColorDepth' : 98, 'ColorMapping' : 100, 'ColorSpace' : 3, 'ColorTreatment' : 120, 'CommentData' : 129, 'CompressMode' : 101, 'ControlPoint1' : 81, 'ControlPoint2' : 82, 'CRGBMinMax' : 20, # deprecated 'CustomMediaSize' : 47, 'CustomMediaSizeUnits' : 48, 'DashOffset' : 67, 'DataOrg' : 130, 'DestinationBox' : 102, 'DestinationSize' : 103, 'DeviceMatrix' : 33, 'DitherMatrixDataType' : 34, 'DitherMatrixDepth' : 51, 'DitherMatrixSize' : 50, 'DitherOrigin' : 35, 'DuplexPageMode' : 53, 'DuplexPageSide' : 54, 'EllipseDimension' : 68, 'EndPoint' : 69, 'ErrorReport' : 143, 'FillMode' : 70, 'FontFormat' : 169, 'FontHeaderLength' : 167, 'FontName' : 168, 'GammaGain' : 21, # deprecated. 'GrayLevel' : 9, 'LineCapStyle' : 71, 'LineDashStyle' : 74, 'LineJoinStyle' : 72, 'Measure' : 134, 'MediaDestination' : 36, 'MediaSize' : 37, 'MediaSource' : 38, 'MediaType' : 39, 'MiterLength' : 73, 'NewDestinationSize' : 13, 'NullBrush' : 4, 'NullPen' : 5, 'NumberOfPoints' : 77, 'NumberOfScanLines' : 115, 'Orientation' : 40, 'PCLSelectFont' : 141, 'PadBytesMultiple' : 110, 'PageAngle' : 41, 'PageCopies' : 49, 'PageOrigin' : 42, 'PageScale' : 43, 'PaletteData' : 6, 'PaletteDepth' : 2, 'PatternDefineID' : 105, 'PatternOrigin' : 12, 'PatternPersistence' : 104, 'PatternSelectID' : 8, 'PenWidth' : 75, 'Point' : 76, 'PointType' : 80, 'PrimaryArray' : 14, 'PrimaryDepth' : 15, 'PrintableArea' : 116, 'RGBColor' : 11, 'ROP3' : 44, 'RasterObjects' : 32, 'SimplexPageMode' : 52, 'SolidLine' : 78, 'SourceHeight' : 107, 'SourceType' : 136, 'SourceWidth' : 108, 'StartLine' : 109, 'StartPoint' : 79, 'StreamDataLength' : 140, 'StreamName' : 139, 'SymbolSet' : 170, 'TextData' : 171, 'TextObjects' : 30, 'TxMode' : 45, 'UnitsPerMeasure' : 137, 'VectorObjects' : 31, 'VUExtension' : 145, 'VUDataLength' : 146, 'VUAttr1' : 147, 'VUAttr2' : 148, 'VUAttr3' : 149, 'VUAttr4' : 150, 'VUAttr5' : 151, 'VUAttr6' : 152, 'WhiteReferencePoint' : 19, # deprecated. 'WritingMode' : 173, # deprecated. 'XSpacingData' : 175, 'XYChromaticities' : 18, # deprecated. 'YSpacingData' : 176, } printables = ''.join([(len(repr(chr(x)))==3) and (x != 47) and (x < 128) and chr(x) or '.' for x in range(256)]) class pxl_dis: def __init__(self, data): # the class does not handle pjl, work around that here. NB # should check for little endian protocol but we haven't seen # it used yet. index = data.index(b") HP-PCL XL;") # copy of the data without the PJL data = data[index:] self.data = data # parse out data order and protocol self.binding = chr_(data[0]) self.protocol = chr_(data[12]) self.revision = chr_(data[14]) # check binding NB - should check other stuff too: # example: )HP-PCL XL;2;0 if self.binding not in ['(', ')']: if (self.binding == '`'): print("The PXL code is already ascii encoded\n", file=sys.stderr) raise(SyntaxError) # replace with python's struct endian flag. if (self.binding == ')'): # little endian self.binding = '<' else: self.binding = '>' # save the what we skipped over so we can record file offsets self.skipped_over = index # pointer to data self.index = 0 # graphic state number of pushes - number of pops self.graphics_state_level = 0 # print out ascii protocol and revision. NB should check # revisions are the same. print("` HP-PCL XL;" + self.protocol + ";" + self.revision) # saved size of last array parsed self.size_of_element = -1; self.size_of_array = -1; self.unpack_string = "" # skip over protocol and revision while( chr_(data[self.index]) != '\n' ): self.index = self.index + 1 self.index = self.index + 1 # dictionary of streams keyed by stream name self.user_defined_streams = {} # the n'th operator in the stream self.operator_position = 0 # The VendorUnique operator can have an optional embedded payload # where the length is stored in the VUDataLength attribute. # We need to cache the value of that atttribute to skip over # that many number of bytes when it is encountered. self.VUDataLength = 0 # true if we get UEL self.endjob = 0 # redefine unpack to handle endiannes def unpack(self, format, data): # prepend the binding to specify the endianness of the XL # stream and standard format, not native. (see struct.py docs) return unpack((b(self.binding) + b(format)), data) # implicitly read when parsing the tag def attributeIDValue(self): return 1 def findTagKey(self, tag): for key in pxl_tags_dict: if ( pxl_tags_dict[key] == tag ): return key return 0 # get the next operator def operatorTag(self): tag = unpackB(self.data[self.index]) key = self.findTagKey(tag) if (not key): return 0 if ( key == "PopGS" ): self.graphics_state_level = self.graphics_state_level - 1 if ( key == "PushGS" ): self.graphics_state_level = self.graphics_state_level + 1 if (not self.isEmbedded(key)): self.operator_position = self.operator_position + 1 print("// Op Pos: %d " % self.operator_position, end=' ') print("Op fOff: %d " % (self.index + self.skipped_over), end=' ') print("Op Hex: %X " % tag, end=' ') print("Level: %d" % self.graphics_state_level) print(key) self.index = self.index + 1 # handle special cases if (self.isEmbedded(key) or (key == 'VendorUnique')): self.process_EmbeddedInfo(key) return 1 def Tag_ubyte(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['ubyte'] ): self.index = self.index + 1 print("ubyte", end=' ') self.unpack_string = 'B' self.size_of_element = 1 return 1 return 0 def Tag_sint16(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint16'] ): self.index = self.index + 1 print("sint16", end=' ') self.unpack_string = 'h' self.size_of_element = 2 return 1 return 0 def Tag_uint16(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint16'] ): self.index = self.index + 1 print("uint16", end=' ') self.unpack_string = 'H' self.size_of_element = 2 return 1 return 0 def Tag_sint32(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint32'] ): self.index = self.index + 1 print("sint32", end=' ') self.unpack_string = 'i' self.size_of_element = 4 return 1 return 0 def Tag_uint32(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint32'] ): self.index = self.index + 1 print("uint32", end=' ') self.unpack_string = 'I' self.size_of_element = 4 return 1 return 0 def Tag_real32(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['real32'] ): self.index = self.index + 1 print("real32", end=' ') self.unpack_string = 'f' self.size_of_element = 4 return 1 return 0 def Tag_ubyte_array(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['ubyte_array'] ): self.index = self.index + 1 self.unpack_string = 'B' self.size_of_element = 1 print("ubyte_array [", end=' ') return 1 return 0 def Tag_uint16_array(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint16_array'] ): self.index = self.index + 1 self.unpack_string = 'H' self.size_of_element = 2 print("uint16_array [", end=' ') return 1 return 0 def Tag_sint16_array(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint16_array'] ): self.index = self.index + 1 self.unpack_string = 'h' self.size_of_element = 2 print("sint16_array [", end=' ') return 1 return 0 def Tag_uint32_array(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint32_array'] ): self.index = self.index + 1 self.unpack_string = 'I' self.size_of_element = 4 print("uint32_array [", end=' ') return 1 return 0 def Tag_sint32_array(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint32_array'] ): self.index = self.index + 1 self.unpack_string = 'i' self.size_of_element = 4 print("sint32_array [", end=' ') return 1 return 0 def Tag_real32_array(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['real32_array'] ): self.index = self.index + 1 self.unpack_string = 'f' self.size_of_element = 4 print("real32_array [", end=' ') return 1 return 0 def Tag_ubyte_xy(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['ubyte_xy'] ): self.index = self.index + 1 print("ubyte_xy %d %d" % \ self.unpack('BB', self.data[self.index:self.index+2]), end=' ') self.index = self.index + 2 return 1 return 0 def Tag_uint16_xy(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint16_xy'] ): self.index = self.index + 1 print("uint16_xy %d %d" % \ self.unpack('HH', self.data[self.index:self.index+4]), end=' ') self.index = self.index + 4 return 1 return 0 def Tag_sint16_xy(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint16_xy'] ): self.index = self.index + 1 print("sint16_xy %d %d" % \ self.unpack('hh', self.data[self.index:self.index+4]), end=' ') self.index = self.index + 4 return 1 return 0 def Tag_uint32_xy(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint32_xy'] ): self.index = self.index + 1 print("uint32_xy" % \ self.unpack('II', self.data[self.index:self.index+8]), end=' ') self.index = self.index + 8 return 1 return 0 def Tag_sint32_xy(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint32_xy'] ): self.index = self.index + 1 print("sint32_xy %d %d" % \ self.unpack('ii', self.data[self.index:self.index+8]), end=' ') self.index = self.index + 8 return 1 return 0 def Tag_real32_xy(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['real32_xy'] ): self.index = self.index + 1 print("real32_xy %f %f" % \ self.unpack('ff', self.data[self.index:self.index+8]), end=' ') self.index = self.index + 8 return 1 return 0 def Tag_ubyte_box(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['ubyte_box'] ): self.index = self.index + 1 print("ubyte_box %d %d %d %d" % \ self.unpack('BBBB', self.data[self.index:self.index+4]), end=' ') self.index = self.index + 4 return 1 return 0 def Tag_uint16_box(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint16_box'] ): self.index = self.index + 1 print("uint16_box %d %d %d %d" % \ self.unpack('hhhh', self.data[self.index:self.index+8]), end=' ') self.index = self.index + 8 return 1 return 0 def Tag_sint16_box(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint16_box'] ): self.index = self.index + 1 print("sint16_box %d %d %d %d" % \ self.unpack('hhhh', self.data[self.index:self.index+8])) self.index = self.index + 8 return 1 return 0 def Tag_uint32_box(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['uint32_box'] ): self.index = self.index + 1 print("uint32_box %d %d %d %d" % \ self.unpack('IIII', self.data[self.index:self.index+16])) self.index = self.index + 32 return 1 return 0 def Tag_sint32_box(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['sint32_box'] ): self.index = self.index + 1 print("sint32_box %d %d %d %d" % \ self.unpack('iiii', self.data[self.index:self.index+16])) self.index = self.index + 16 return 1 return 0 def Tag_real32_box(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['real32_box'] ): self.index = self.index + 1 print("real32_box %f %f %f %f" % \ self.unpack('ffff', self.data[self.index:self.index+16])) self.index = self.index + 16 return 1 return 0 def dump(self, src): N=0 result=[] while src: s,src = src[:16],src[16:] hexa = ' '.join(["%02X"% ord_(x) for x in s]) s = ''.join(printables[ord_(x)] for x in s) result += "%04X %-*s %s\n" % (N, 16*3, hexa, s) N+=16 return ''.join(result) # check for embedded tags. def isEmbedded(self, name): return ( name == 'embedded_data' or name == 'embedded_data_byte') def process_EmbeddedInfo(self, name): if ( name == 'embedded_data' ): length = self.unpack('I', self.data[self.index:self.index+4])[0] self.index = self.index + 4 if ( name == 'embedded_data_byte' ): length = int(self.unpack('B', self.data[self.index:self.index+1])[0]) self.index = self.index + 1 if ( name == 'VendorUnique' ): length = self.VUDataLength self.VUDataLength = 0 print("length:", end=' ') print(length) print("[") print(self.dump(self.data[self.index:self.index+length])) print("]") self.index = self.index + length def Tag_attr_ubyte(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['attr_ubyte'] ): self.index = self.index + 1 tag = unpackB(self.data[self.index]) for k in pxl_attribute_name_to_attribute_number_dict: if ( pxl_attribute_name_to_attribute_number_dict[k] == tag ): if (k == 'VUDataLength'): # The VUDataLength is only ever seen with the CLJ3500/3550/3600 # as part of an optional VendorUnque payload; it is possible # that its value type can be something else other than uint32. # We'll just backtrack to get a uint32 value, and raise an error # if it isn't uint32. vu_tag = unpackB(self.data[self.index-6]) if ( vu_tag == pxl_tags_dict['uint32'] ): self.VUDataLength = int(self.unpack('I', self.data[self.index-5:self.index-1])[0]) else: raise(SyntaxError)("VUDataLength not uint32") print(k, end='') if (k in pxl_enumerations_dict): print(" //", end=' ') searchstr = "=" + str(self.saved_value) enum = pxl_enumerations_dict[k] enumeration_not_found = 1 for value in enum: if ( value[value.index('='):] == searchstr ): enumeration_not_found = 0 print(value) break if (enumeration_not_found): # we print here mainly to to avoid side effect # of the // above if no enumeration is found. print('Unknown enumeration') else: print() self.index = self.index + 1 # handle special cases if ( self.isEmbedded(k) ): self.process_EmbeddedInfo(k) return 1 print("Unlisted attribute number:", tag, file=sys.stderr) raise(SyntaxError)("Unlisted attribute number in PXL stream") return 0 def Tag_attr_uint16(self): new_tag = unpackB(self.data[self.index]) if ( new_tag == pxl_tags_dict['attr_uint16'] ): self.index = self.index + 1 print("Attribute tag uint16 # NOT IMPLEMENTED #", self.unpack('HH', self.data[self.index] )) self.index = self.index + 2 return 1 return 0 def attributeID(self): return (self.Tag_attr_ubyte() or self.Tag_attr_uint16()) and self.attributeIDValue() def singleValueType(self): if ( self.Tag_ubyte() or self.Tag_uint16() or self.Tag_uint32() or \ self.Tag_sint16() or self.Tag_sint32() or self.Tag_real32() ): size = self.size_of_element if ( self.unpack_string == 'f' ): print("%f" % self.unpack(self.unpack_string, self.data[self.index:self.index+size]), end=' ') else: print("%d" % self.unpack(self.unpack_string, self.data[self.index:self.index+size]), end=' ') if (( self.unpack_string == 'B' and size == 1 ) or \ ( self.unpack_string == 'I' and size == 4 )): self.saved_value = self.unpack(self.unpack_string, self.data[self.index:self.index+size])[0] self.index = self.index + self.size_of_element return 1 return 0 def xyValueType(self): return self.Tag_ubyte_xy() or self.Tag_uint16_xy() or self.Tag_uint32_xy() or \ self.Tag_sint16_xy() or self.Tag_sint32_xy() or self.Tag_real32_xy() def boxValueType(self): return self.Tag_ubyte_box() or self.Tag_uint16_box() or self.Tag_uint32_box() or \ self.Tag_sint16_box() or self.Tag_sint32_box() or self.Tag_real32_box() def valueType(self): return self.singleValueType() or self.xyValueType() or self.boxValueType() def arraySizeType(self): return self.Tag_ubyte() or self.Tag_uint16() def arraySize(self): # save the old unpack string for the type of the array, the data type for the size # will replace it. unpack_string = self.unpack_string size_of_element = self.size_of_element if ( self.arraySizeType() ): self.size_of_array = self.unpack( self.unpack_string, \ self.data[self.index:self.index+self.size_of_element] )[0] print(self.size_of_array, end='') self.index = self.index + self.size_of_element # restore the unpack string self.unpack_string = unpack_string self.size_of_element = size_of_element return 1 return 0 def singleValueArrayType(self): return self.Tag_ubyte_array() or self.Tag_uint16_array() or \ self.Tag_uint32_array() or self.Tag_sint16_array() or \ self.Tag_sint32_array() or self.Tag_real32_array() def arrayType(self): if (self.singleValueArrayType() and self.arraySize()): array_size = self.size_of_element * self.size_of_array array_elements = self.unpack( str(self.size_of_array) + self.unpack_string, \ self.data[self.index:self.index+array_size] ) # hex dump byte arrays if (self.size_of_element == 1): print() print(self.dump(self.data[self.index:self.index+array_size])) print("]", end=' ') else: print(end=' ') for num in array_elements: print(num, end=' ') print("]", end=' ') self.index = self.index + array_size return 1 return 0 def dataType(self): return( self.valueType() or self.arrayType() or self.boxValueType() ) # these get parsed when doing the tags def numericValue(self): return 1; def attributeValue(self): return( self.dataType() and self.numericValue() ) def singleAttributePair(self): return( self.attributeValue() and self.attributeID() ) def multiAttributeList(self): # NB should be many 1+ not sure how this get handled yet return( self.singleAttributePair() ) def nullAttributeList(self): # NB not sure return 0 def attributeList(self): return (self.singleAttributePair() or self.multiAttributeList() or self.nullAttributeList()) def attributeLists(self): # save the beginning of the attribute list even if it is # empty. So we can report the position of the command. self.begin_attribute_pos = self.index # 0 or more attribute lists while( self.attributeList() ): continue return 1 def UEL(self): if ( self.data[self.index:self.index+9] == b"\033%-12345X" ): print('string* \\x1B%-12345X') self.index = self.index + 9 self.endjob = 1; return 1 return 0 def operatorSequences(self): while ( self.attributeLists() and self.operatorTag() ) or self.UEL(): print() if ( self.endjob == 1 ): raise IndexError # hack see below else: continue def disassemble(self): try: self.operatorSequences() # assume an index error means we have processed everything - ugly except IndexError: return except KeyboardInterrupt: print("^C pressed. Terminating...", file=sys.stderr) return except IOError as msg: # broken pipe when user quits a downsream pager if msg.args == (32,'Broken pipe'): print("Broken pipe...", file=sys.stderr) return else: raise else: print("dissassemble failed at file position %d" % self.index, file=sys.stderr) endpos = min(len(self.data), self.index + 25) for byte in self.data[self.index:endpos]: print(hex(ord(byte)), end=' ', file=sys.stderr) print() if __name__ == '__main__': import sys if not sys.argv[1:]: print("Usage: %s pxl files" % sys.argv[0]) files = sys.argv[1:] for file in files: try: fp = open(file, 'rb') except: print("Cannot find file %s" % file) continue # read the whole damn thing. If this get too cumbersome we # can switch to string i/o which will use a disk pxl_code = fp.read() fp.close() # initialize and disassemble. pxl_stream = pxl_dis(pxl_code) pxl_stream.disassemble()