skia2/experimental/PdfViewer/spec2def.py

611 lines
26 KiB
Python

#!/usr/local/bin/python
# coding: utf-8
import sys
import re
# TODO(edisonn): put processed part of file in a new file
# put unprocessed part, in a new file, so we see what we miss
# keep blank lines, and generate a version without the blank lines
#TODO (edisonn): deal manually with tables that don't have "KEY TYPE VALUE' header, e.g.
# TABLE 7.11 Restrictions on the entries in a soft-mask image dictionary
#KEY RESTRICTION
lines = 0
table = ''
tableHeaderFound = False
tableLine = 0
tableRow = 0
columnWidth = []
columnValues = None
mustFollowTableHeader = False
emitedDitionaryName = ''
knownTypes = {
'(any)',
unicode('undefined', 'utf8'),
'(undefined)',
'(various)',
'array',
'or',
'boolean',
'date',
'dictionary',
'function',
'integer',
unicode('file', 'utf8'),
'file',
unicode('specification', 'utf8'),
'specification',
'name',
'tree',
'number',
'rectangle',
'stream',
'string',
'text',
',',
' '
}
# TODO(edisonn): add a third element in the vector, the base class, by default it is Dictionary
# TODO(edisonn): add overrides for types map<field_name, type_name>
# e.g. ,{'Resources', 'ResourceDictionary'}
# TODO(edisonn): can be added one by one, or extracted from documentation
tableToClassName = {
'TABLE 3.4': ['StreamCommonDictionary', 'Entries common to all stream dictionaries'],
'TABLE 3.7': ['LzwdecodeAndFlatedecodeFiltersDictionary', 'Optional parameters for LZWDecode and FlateDecode filters'],
'TABLE 3.9': ['CcittfaxdecodeFilterDictionary', 'Optional parameters for the CCITTFaxDecode filter'],
'TABLE 3.10': ['Jbig2DecodeFilterDictionary', 'Optional parameter for the JBIG2Decode filter'],
'TABLE 3.11': ['DctdecodeFilterDictionary', 'Optional parameter for the DCTDecode filter'],
'TABLE 3.12': ['FileTrailerDictionary', 'Entries in the file trailer dictionary'],
'TABLE 3.13': ['EncryptionCommonDictionary', 'Entries common to all encryption dictionaries'],
'TABLE 3.14': ['StandardSecurityHandlerDictionary', 'Additional encryption dictionary entries for the standard security handler'],
'TABLE 3.16': ['CatalogDictionary', 'Entries in the catalog dictionary'],
'TABLE 3.17': ['PageTreeNodeDictionary', 'Required entries in a page tree node'],
'TABLE 3.18': ['PageObjectDictionary', 'Entries in a page object'],
'TABLE 3.19': ['NameDictionary', 'Entries in the name dictionary'],
'TABLE 3.21': ['ResourceDictionary', 'Entries in a resource dictionary'],
'TABLE 3.23': ['NameTreeNodeDictionary', 'Entries in a name tree node dictionary'],
'TABLE 3.25': ['NumberTreeNodeDictionary', 'Entries in a number tree node dictionary'],
'TABLE 3.26': ['FunctionCommonDictionary', 'Entries common to all function dictionaries'],
'TABLE 3.27': ['Type0FunctionDictionary', 'Additional entries specific to a type 0 function dictionary'],
'TABLE 3.28': ['Type2FunctionDictionary', 'Additional entries specific to a type 2 function dictionary'],
'TABLE 3.29': ['Type3FunctionDictionary', 'Additional entries specific to a type 3 function dictionary'],
'TABLE 3.32': ['FileSpecificationDictionary', 'Entries in a file specification dictionary'],
'TABLE 3.33': ['EmbeddedFileStreamDictionary', 'Additional entries in an embedded file stream dictionary'],
'TABLE 3.34': ['EmbeddedFileParameterDictionary', 'Entries in an embedded file parameter dictionary'],
'TABLE 3.35': ['MacOsFileInformationDictionary', 'Entries in a Mac OS file information dictionary'],
'TABLE 4.8': ['GraphicsStateDictionary', 'Entries in a graphics state parameter dictionary'],
'TABLE 4.13': ['CalgrayColorSpaceDictionary', 'Entries in a CalGray color space dictionary'],
'TABLE 4.14': ['CalrgbColorSpaceDictionary', 'Entries in a CalRGB color space dictionary'],
'TABLE 4.15': ['LabColorSpaceDictionary', 'Entries in a Lab color space dictionary'],
'TABLE 4.16': ['IccProfileStreamDictionary', 'Additional entries specific to an ICC profile stream dictionary'],
'TABLE 4.20': ['DeviceNColorSpaceDictionary', 'Entry in a DeviceN color space attributes dictionary'],
'TABLE 4.22': ['Type1PatternDictionary', 'Additional entries specific to a type 1 pattern dictionary'],
'TABLE 4.23': ['Type2PatternDictionary', 'Entries in a type 2 pattern dictionary'],
'TABLE 4.25': ['ShadingDictionary', 'Entries common to all shading dictionaries'],
'TABLE 4.26': ['Type1ShadingDictionary', 'Additional entries specific to a type 1 shading dictionary', 'ShadingDictionary'],
'TABLE 4.27': ['Type2ShadingDictionary', 'Additional entries specific to a type 2 shading dictionary', 'ShadingDictionary'],
'TABLE 4.28': ['Type3ShadingDictionary', 'Additional entries specific to a type 3 shading dictionary', 'ShadingDictionary'],
'TABLE 4.29': ['Type4ShadingDictionary', 'Additional entries specific to a type 4 shading dictionary', 'ShadingDictionary'],
'TABLE 4.30': ['Type5ShadingDictionary', 'Additional entries specific to a type 5 shading dictionary', 'ShadingDictionary'],
'TABLE 4.31': ['Type6ShadingDictionary', 'Additional entries specific to a type 6 shading dictionary', 'ShadingDictionary'],
'TABLE 4.35': ['ImageDictionary', 'Additional entries specific to an image dictionary', 'XObjectDictionary', {'Subtype': 'datatypes.PdfName(\'Image\')'}],
'TABLE 4.37': ['AlternateImageDictionary', 'Entries in an alternate image dictionary'],
'TABLE 4.41': ['Type1FormDictionary', 'Additional entries specific to a type 1 form dictionary', 'XObjectDictionary', {'Subtype': 'datatypes.PdfName(\'Form\')'}],
'TABLE 4.42': ['GroupAttributesDictionary', 'Entries common to all group attributes dictionaries'],
'TABLE 4.43': ['ReferenceDictionary', 'Entries in a reference dictionary'],
'TABLE 4.44': ['PSXobjectDictionary', 'Additional entries specific to a PostScript XObject dictionary'],
'TABLE 5.8': ['Type1FontDictionary', 'Entries in a Type 1 font dictionary', 'FontDictionary'],
'TABLE 5.9': ['Type3FontDictionary', 'Entries in a Type 3 font dictionary', 'FontDictionary'],
'TABLE 5.11': ['EncodingDictionary', 'Entries in an encoding dictionary'],
'TABLE 5.12': ['CIDSystemInfoDictionary', 'Entries in a CIDSystemInfo dictionary'],
'TABLE 5.13': ['CIDFontDictionary', 'Entries in a CIDFont dictionary', 'FontDictionary'],
'TABLE 5.16': ['CMapDictionary', 'Additional entries in a CMap dictionary'],
'TABLE 5.17': ['Type0FontDictionary', 'Entries in a Type 0 font dictionary', 'FontDictionary'],
'TABLE 5.18': ['FontDescriptorDictionary', 'Entries common to all font descriptors'],
'TABLE 5.20': ['CIDFontDescriptorDictionary', 'Additional font descriptor entries for CIDFonts'],
'TABLE 5.23': ['EmbeddedFontStreamDictionary', 'Additional entries in an embedded font stream dictionary'],
'TABLE 6.3': ['Type1HalftoneDictionary', 'Entries in a type 1 halftone dictionary'],
'TABLE 6.4': ['Type6HalftoneDictionary', 'Additional entries specific to a type 6 halftone dictionary'],
'TABLE 6.5': ['Type10HalftoneDictionary', 'Additional entries specific to a type 10 halftone dictionary'],
'TABLE 6.6': ['Type16HalftoneDictionary', 'Additional entries specific to a type 16 halftone dictionary'],
'TABLE 6.7': ['Type5HalftoneDictionary', 'Entries in a type 5 halftone dictionary'],
'TABLE 7.10': ['SoftMaskDictionary', 'Entries in a soft-mask dictionary'],
'TABLE 7.12': ['SoftMaskImageDictionary', 'Additional entry in a soft-mask image dictionary'],
'TABLE 7.13': ['TransparencyGroupDictionary', 'Additional entries specific to a transparency group attributes dictionary'],
'TABLE 8.1': ['ViewerPreferencesDictionary', 'Entries in a viewer preferences dictionary'],
'TABLE 8.3': ['OutlineDictionary', 'Entries in the outline dictionary'],
'TABLE 8.4': ['OutlineItemDictionary', 'Entries in an outline item dictionary'],
'TABLE 8.6': ['PageLabelDictionary', 'Entries in a page label dictionary'],
'TABLE 8.7': ['ThreadDictionary', 'Entries in a thread dictionary'],
'TABLE 8.8': ['BeadDictionary', 'Entries in a bead dictionary'],
'TABLE 8.9': ['TransitionDictionary', 'Entries in a transition dictionary'],
'TABLE 8.10': ['AnnotationDictionary', 'Entries common to all annotation dictionaries'],
'TABLE 8.12': ['BorderStyleDictionary', 'Entries in a border style dictionary'],
'TABLE 8.13': ['AppearanceDictionary', 'Entries in an appearance dictionary'],
'TABLE 8.15': ['TextAnnotationDictionary', 'Additional entries specific to a text annotation'],
'TABLE 8.16': ['ALinkAnnotationDictionary', 'Additional entries specific to a link annotation'],
'TABLE 8.17': ['FreeTextAnnotationDictionary', 'Additional entries specific to a free text annotation'],
'TABLE 8.18': ['LineAnnotationDictionary', 'Additional entries specific to a line annotation'],
'TABLE 8.20': ['SquareOrCircleAnnotation', 'Additional entries specific to a square or circle annotation'],
'TABLE 8.21': ['MarkupAnnotationsDictionary', 'Additional entries specific to markup annotations'],
'TABLE 8.22': ['RubberStampAnnotationDictionary', 'Additional entries specific to a rubber stamp annotation'],
'TABLE 8.23': ['InkAnnotationDictionary', 'Additional entries specific to an ink annotation'],
'TABLE 8.24': ['PopUpAnnotationDictionary', 'Additional entries specific to a pop-up annotation'],
'TABLE 8.25': ['FileAttachmentAnnotationDictionary', 'Additional entries specific to a file attachment annotation'],
'TABLE 8.26': ['SoundAnnotationDictionary', 'Additional entries specific to a sound annotation'],
'TABLE 8.27': ['MovieAnnotationDictionary', 'Additional entries specific to a movie annotation'],
'TABLE 8.28': ['WidgetAnnotationDictionary', 'Additional entries specific to a widget annotation'],
'TABLE 8.29': ['ActionDictionary', 'Entries common to all action dictionaries'],
'TABLE 8.30': ['AnnotationActionsDictionary', 'Entries in an annotation\'s additional-actions dictionary'],
'TABLE 8.31': ['PageObjectActionsDictionary', 'Entries in a page object\'s additional-actions dictionary'],
'TABLE 8.32': ['FormFieldActionsDictionary', 'Entries in a form field\'s additional-actions dictionary'],
'TABLE 8.33': ['DocumentCatalogActionsDictionary', 'Entries in the document catalog\'s additional-actions dictionary'],
'TABLE 8.35': ['GoToActionDictionary', 'Additional entries specific to a go-to action'],
'TABLE 8.36': ['RemoteGoToActionDictionary', 'Additional entries specific to a remote go-to action'],
'TABLE 8.37': ['LaunchActionDictionary', 'Additional entries specific to a launch action'],
'TABLE 8.38': ['WindowsLaunchActionDictionary', 'Entries in a Windows launch parameter dictionary'],
'TABLE 8.39': ['ThreadActionDictionary', 'Additional entries specific to a thread action'],
'TABLE 8.40': ['URIActionDictionary', 'Additional entries specific to a URI action'],
'TABLE 8.41': ['URIDictionary', 'Entry in a URI dictionary'],
'TABLE 8.42': ['SoundActionDictionary', 'Additional entries specific to a sound action'],
'TABLE 8.43': ['MovieActionDictionary', 'Additional entries specific to a movie action'],
'TABLE 8.44': ['HideActionDictionary', 'Additional entries specific to a hide action'],
'TABLE 8.46': ['NamedActionsDictionary', 'Additional entries specific to named actions'],
'TABLE 8.47': ['InteractiveFormDictionary', 'Entries in the interactive form dictionary'],
'TABLE 8.49': ['FieldDictionary', 'Entries common to all field dictionaries'],
'TABLE 8.51': ['VariableTextFieldDictionary', 'Additional entries common to all fields containing variable text'],
'TABLE 8.52': ['AppearanceCharacteristicsDictionary', 'Entries in an appearance characteristics dictionary'],
'TABLE 8.54': ['CheckboxFieldDictionary', 'Additional entry specific to a checkbox field'],
'TABLE 8.55': ['RadioButtonFieldDictionary', 'Additional entry specific to a radio button field'],
'TABLE 8.57': ['TextFieldDictionary', 'Additional entry specific to a text field'],
'TABLE 8.59': ['ChoiceFieldDictionary', 'Additional entries specific to a choice field'],
'TABLE 8.60': ['SignatureDictionary', 'Entries in a signature dictionary'],
'TABLE 8.61': ['SubmitFormActionDictionary', 'Additional entries specific to a submit-form action'],
'TABLE 8.63': ['ResetFormActionDictionary', 'Additional entries specific to a reset-form action'],
'TABLE 8.65': ['ImportDataActionDictionary', 'Additional entries specific to an import-data action'],
'TABLE 8.66': ['JavascriptActionDictionary', 'Additional entries specific to a JavaScript action'],
'TABLE 8.67': ['FDFTrailerDictionary', 'Entry in the FDF trailer dictionary'],
'TABLE 8.68': ['FDFCatalogDictionary', 'Entries in the FDF catalog dictionary'],
'TABLE 8.69': ['FDFDictionary', 'Entries in the FDF dictionary'],
'TABLE 8.70': ['EncryptedEmbeddedFileStreamDictionary', 'Additional entry in an embedded file stream dictionary for an encrypted FDF file'],
'TABLE 8.71': ['JavascriptDictionary', 'Entries in the JavaScript dictionary'],
'TABLE 8.72': ['FDFFieldDictionary', 'Entries in an FDF field dictionary'],
'TABLE 8.73': ['IconFitDictionary', 'Entries in an icon fit dictionary'],
'TABLE 8.74': ['FDFPageDictionary', 'Entries in an FDF page dictionary'],
'TABLE 8.75': ['FDFTemplateDictionary', 'Entries in an FDF template dictionary'],
'TABLE 8.76': ['FDFNamedPageReferenceDictionary', 'Entries in an FDF named page reference dictionary'],
'TABLE 8.77': ['FDFFileAnnotationDictionary', 'Additional entry for annotation dictionaries in an FDF file'],
'TABLE 8.78': ['SoundObjectDictionary', 'Additional entries specific to a sound object'],
'TABLE 8.79': ['MovieDictionary', 'Entries in a movie dictionary'],
'TABLE 8.80': ['MovieActivationDictionary', 'Entries in a movie activation dictionary'],
'TABLE 9.2': ['DocumentInformationDictionary', 'Entries in the document information dictionary'],
'TABLE 9.3': ['MetadataStreamDictionary', 'Additional entries in a metadata stream dictionary'],
'TABLE 9.4': ['ComponentsWithMetadataDictionary', 'Additional entry for components having metadata'],
'TABLE 9.6': ['PagePieceDictionary', 'Entries in a page-piece dictionary'],
'TABLE 9.7': ['ApplicationDataDictionary', 'Entries in an application data dictionary'],
'TABLE 9.9': ['StructureTreeRootDictionary', 'Entries in the structure tree root'],
'TABLE 9.10': ['StructureElementDictionary', 'Entries in a structure element dictionary'],
'TABLE 9.11': ['MarkedContentReferenceDictionary', 'Entries in a marked-content reference dictionary'],
'TABLE 9.12': ['ObjectReferenceDictionary', 'Entries in an object reference dictionary'],
'TABLE 9.13': ['StructureElementAccessDictionary', 'Additional dictionary entries for structure element access'],
'TABLE 9.14': ['AttributeObjectDictionary', 'Entry common to all attribute objects'],
'TABLE 9.15': ['MarkInformationDictionary', 'Entry in the mark information dictionary'],
'TABLE 9.16': ['ArtifactsDictionary', 'Property list entries for artifacts'],
'TABLE 9.27': ['StandardStructureDictionary', 'Standard layout attributes common to all standard structure types'],
'TABLE 9.28': ['BlockLevelStructureElementsDictionary', 'Additional standard layout attributes specific to block-level structure elements'],
'TABLE 9.29': ['InlineLevelStructureElementsDictionary', 'Standard layout attributes specific to inline-level structure elements'],
'TABLE 9.30': ['ListAttributeDictionary', 'Standard list attribute'],
'TABLE 9.31': ['TableAttributesDictionary', 'Standard table attributes'],
'TABLE 9.32': ['WebCaptureInformationDictionary', 'Entries in the Web Capture information dictionary'],
'TABLE 9.33': ['WebCaptureDictionary', 'Entries common to all Web Capture content sets'],
'TABLE 9.34': ['WebCapturePageSetDictionary', 'Additional entries specific to a Web Capture page set'],
'TABLE 9.35': ['WebCaptureImageSetDictionary', 'Additional entries specific to a Web Capture image set'],
'TABLE 9.36': ['SourceInformationDictionary', 'Entries in a source information dictionary'],
'TABLE 9.37': ['URLAliasDictionary', 'Entries in a URL alias dictionary'],
'TABLE 9.38': ['WebCaptureCommandDictionary', 'Entries in a Web Capture command dictionary'],
'TABLE 9.40': ['WebCaptureCommandSettingsDictionary', 'Entries in a Web Capture command settings dictionary'],
'TABLE 9.41': ['BoxColorInformationDictionary', 'Entries in a box color information dictionary'],
'TABLE 9.42': ['BoxStyleDictionary', 'Entries in a box style dictionary'],
'TABLE 9.43': ['PrinterMarkAnnotationDictionary', 'Additional entries specific to a printer\'s mark annotation'],
'TABLE 9.44': ['PrinterMarkFormDictionary', 'Additional entries specific to a printer\'s mark form dictionary'],
'TABLE 9.45': ['SeparationDictionary', 'Entries in a separation dictionary'],
'TABLE 9.46': ['PDF_XOutputIntentDictionary', 'Entries in a PDF/X output intent dictionary'],
'TABLE 9.47': ['TrapNetworkAnnotationDictionary', 'Additional entries specific to a trap network annotation'],
'TABLE 9.48': ['TrapNetworkAppearanceStreamDictionary', 'Additional entries specific to a trap network appearance stream'],
'TABLE 9.49': ['OpiVersionDictionary', 'Entry in an OPI version dictionary'],
}
def acceptType(val):
global knownTypes
ret = val
for item in knownTypes:
ret = ret.replace(item, '')
return ret == ''
def inTable():
global tableHeaderFound
return tableHeaderFound
def tableDescriptionFound(desc):
global table
table = desc.strip()
def tableHasHeader():
global table
global tableHeaderFound
tableHeaderFound = True
#print table
def fix(val):
ret = val
# fix unicode chars
ret = ret.replace(unicode('', 'utf8'), 'fi')
ret = ret.replace(u'\u201c', '\"')
ret = ret.replace(u'\u201d', '\"')
ret = ret.replace(u'\u2019', '\'')
ret = ret.replace(u'\ufb02', 'fl')
ret = ret.replace(u'\xae', '(R)')
ret = ret.replace(u'\u2026', '...')
ret = ret.replace(u'\xd7', 'x')
ret = ret.replace(u'\u2212', '-')
ret = ret.replace(u'\u2264', '<=')
ret = ret.replace(u'\u2014', '-')
ret = ret.replace(u'\u2013', '\'')
ret = ret.replace(u'\u2022', '*')
ret = ret.replace(u'\xb5', 'mu')
ret = ret.replace(u'\xf7', '/')
# how enable to emit this a python string
ret = ret.replace('\'', '\\\'')
ret = ret.replace('\n', '\\n')
return ret
def commitRow():
global columnValues
global emitedDitionaryName
global table
global tableToClassName
if columnValues == None:
return
#print columnValues
lastClosed = columnValues[2].find(')')
if lastClosed < 0:
print 'ERRRRRRRRRRRRRRROR'
print columnValues
return
spec = columnValues[2][:lastClosed + 1]
spec = spec.replace('(', ';')
spec = spec.replace(')', ';')
spec = spec.strip(';')
specs = spec.split(';')
# clearly required, but it can be required with conditions. don't handle this ones here, but manually
required = specs[0] == 'Required'
inheritable = False
version = ''
for s in specs:
if s.strip() == 'inheritable' or s.strip() == 'Inheritable':
inheritable = True
elif re.match('^PDF [0-9]*[\.[0-9]*]*', s.strip()):
version = s.strip()
elif s != 'Required':
required = False
#print spec
#print specs
#print required
#print inheritable
#print version
#print columnValues
columnValues = [fix(columnValues[0]), fix(columnValues[1]), fix(columnValues[2])]
tableKey = re.search('(TABLE [0-9].[0-9][0-9]?)', table).group(1)
if emitedDitionaryName == '':
table = fix(table)
#print table
emitedDitionaryName = 'foo'
e = re.search('[Entries|Entry] in [a-z]* (.* dictionary)', table)
a = re.search('Additional [a-z]* in a[n]? (.* dictionary)', table)
s = re.search('Additional [a-z]* (.*)', table)
c = re.search('[Entries|Entry] common to all (.*)', table)
o1 = re.search('Optional parameter[s]? for the (.*)', table)
o2 = re.search('Optional parameter[s]? for (.*)', table)
t = re.search('.*ntries in [a-z]* (.*)', table)
r = re.search('Property list entries for (.*)', table)
st = re.search('Standard (.*)', table)
if e:
emitedDitionaryName = e.group(1).title().replace(' ', '')
#print emitedDitionaryName
elif a:
emitedDitionaryName = a.group(1).title().replace(' ', '')
#print emitedDitionaryName
elif s:
emitedDitionaryName = s.group(1).title().replace(' ', '')
#print emitedDitionaryName
elif c:
emitedDitionaryName = c.group(1).title().replace(' ', '') + 'Common'
#print emitedDitionaryName
elif o1:
emitedDitionaryName = o1.group(1).title().replace(' ', '') + 'OptionalParameters'
#print emitedDitionaryName
elif o2:
emitedDitionaryName = o2.group(1).title().replace(' ', '') + 'OptionalParameters'
#print emitedDitionaryName
elif t:
emitedDitionaryName = t.group(1).title().replace(' ', '') + 'Dictionary'
#print emitedDitionaryName
elif r:
emitedDitionaryName = r.group(1).title().replace(' ', '') + 'Dictionary'
#print emitedDitionaryName
elif st:
emitedDitionaryName = st.group(1).title().replace(' ', '') + 'Dictionary'
#print emitedDitionaryName
#else:
#print table
#print tableKey
#print('\'' + tableKey + '\': [\'' + emitedDitionaryName + '\', \'' + table[len(tableKey) + 1:] + '\'],')
emitedDitionaryName = tableToClassName[tableKey][0]
comment = fix(tableToClassName[tableKey][1])
if len(tableToClassName[tableKey]) >= 3 and tableToClassName[tableKey][2] != '':
print(' pdfspec.addClass(\'' + emitedDitionaryName + '\', \'' + tableToClassName[tableKey][2] + '\', \'' + comment + '\')\\')
else:
print(' pdfspec.addClass(\'' + emitedDitionaryName + '\', \'Dictionary\', \'' + comment + '\')\\')
if len(tableToClassName[tableKey]) >= 4 and columnValues[0] in tableToClassName[tableKey][3]:
required = True
if required:
print(' .required(\'NULL\')\\')
else:
print(' .optional()\\')
print(' .field(\'' + columnValues[0] + '\')\\')
print(' .name(\'' + columnValues[0] + '\')\\')
print(' .type(\'' + columnValues[1] + '\')\\')
print(' .comment(\'' + columnValues[2] + '\')\\')
if len(tableToClassName[tableKey]) >= 4 and columnValues[0] in tableToClassName[tableKey][3]:
print(' .must(' + tableToClassName[tableKey][3][columnValues[0]] + ')\\')
print(' .done().done()\\')
columnValues = None
def newRow(first, second, third):
global columnValues
columnValues = [first.rstrip(), second.rstrip(), third.rstrip()]
def appendRow(second, third):
global columnValues
if second.rstrip() != '':
columnValues[1] = columnValues[1] + ' ' + second.rstrip()
if third.rstrip() != '':
columnValues[2] = columnValues[2] + '\n' + third.rstrip()
def rebaseTable(line):
global knownTypes
global columnWidth
line2 = line.replace(',', ' , ')
words = line2.split()
if len(words) < 3:
return False
i = 1
while i < len(words) - 1 and words[i] in knownTypes:
i = i + 1
if words[i].startswith('(Optional') or words[i].startswith('(Required'):
commitRow()
columnWidth[0] = line.find(words[1])
if words[i].startswith('(Optional'):
columnWidth[1] = line.find('(Optional') - columnWidth[0]
if words[i].startswith('(Required'):
columnWidth[1] = line.find('(Required') - columnWidth[0]
return True
return False
def stopTable():
global tableHeaderFound
global emitedDitionaryName
if not inTable():
return
commitRow()
tableHeaderFound = False
emitedDitionaryName = ''
print(' .done()')
print
def killTable():
return
def processLineCore(line):
global lines
global tableLine
global tableRow
global columnWidth
global columnValues
global mustFollowTableHeader
global fnewspec
lines = lines + 1
line = unicode(line, 'utf8')
striped = line.rstrip()
words = line.split()
if len(words) == 0:
stopTable()
return False
isTableHeader = re.search('^[\s]*(TABLE [0-9].[0-9][0-9]?)', striped)
if isTableHeader:
stopTable()
tableDescriptionFound(striped)
mustFollowTableHeader = True
return False
if mustFollowTableHeader:
mustFollowTableHeader = False
if len(words) != 3:
killTable()
return False
# TODO(edisonn): support for generic table!
if words[0] != 'KEY' or words[1] != 'TYPE' or words[2] != 'VALUE':
killTable()
return False
tableHasHeader()
columnWidth = [0, 0, 0]
columnWidth[0] = striped.index('TYPE')
columnWidth[1] = striped.index('VALUE') - striped.index('TYPE')
columnWidth[2] = 0
return True
if inTable():
tableLine = tableLine + 1
first = striped[0 : columnWidth[0]]
second = striped[columnWidth[0] : columnWidth[0] + columnWidth[1]]
third = striped[columnWidth[0] + columnWidth[1] :]
if tableLine == 1:
if third[0] != '(':
killTable()
return False
newRow(first, second, third)
return True
if rebaseTable(striped):
first = striped[0 : columnWidth[0]]
second = striped[columnWidth[0] : columnWidth[0] + columnWidth[1]]
third = striped[columnWidth[0] + columnWidth[1] :]
first = first.rstrip()
second = second.rstrip()
third = third.rstrip()
if first == '' and second == '' and third != '':
appendRow(second, third)
return True
if len(first.split()) > 1:
stopTable()
return False
if first != '' and first[0] == ' ':
stopTable()
return False
if first != '' and second != '' and third == '':
stopTable()
return False
if first == '' and second != '' and second[0] != ' ':
if acceptType(second):
appendRow(second, third)
return True
else:
stopTable()
return False
if first != '' and second != '' and third[0] != '(':
stopTable()
return False
if first == '' and second != '' and second[0] == ' ':
stopTable()
return False
if first != '' and second != '' and third[0] == '(':
commitRow()
newRow(first, second, third)
return True
return False
return False
def processLine(line):
global fnewspec
inSpec = processLineCore(line)
#just return, use the next lines if you wish to rewrite spec
return
if inSpec:
#resize colum with types
line = line[:columnWidth[0] + columnWidth[1]] + (' ' * (60 - columnWidth[1])) + line[columnWidth[0] + columnWidth[1]:]
line = line[:columnWidth[0]] + (' ' * (40 - columnWidth[0])) + line[columnWidth[0]:]
fnewspec.write(line)
def generateDef():
global lines
global fnewspec
#fnewspec = open('PdfReference-okular-2.txt', 'w')
print 'import datatypes'
print
print 'def buildPdfSpec(pdfspec):'
for line in sys.stdin:
processLine(line)
# close last table if it was not closed already
stopTable()
print
#print lines
#fnewspec.close()
if '__main__' == __name__:
sys.exit(generateDef())