#!/usr/bin/env python
"""
Convert Psion Series3 data to XML

build with the fileformat description as in the psionic files

Copyright (c) 2001 Geert Stappers

Copyright notice:
You are free to use & copy this script as long as you keep it as it is.

Change permission:
You are allowed the change this script as long as you publish the
new version on the Internet and reference to Geert Stappers as (co-)author.

Comments are welcome, sent them to Geert.Stappers@xs4all.nl

todo:
 - update this "triple quote doc string"
 - length in header info for roundtripping
 - add extended header code, not just print statements
 - add option to set skip_deleted
 - add option to set try_recover
"""
__version__ = "$Id: s3data2xml.py,v 1.1.1.1 2002/11/05 21:02:29 stappers Exp $"
# First Public Release at 15 september 2001

# NOTE(review): this file was restored from a copy in which everything that
# looked like markup had been stripped out of the string literals.  The
# following are reconstructions and must be confirmed against a pristine copy
# of the script: every XML element/attribute/comment text except "label",
# "header", "footer", "<phone/>", "<lf/>" and the root element, and the bodies
# of getrecordtal(), getsubrecordtal() and printxmlrecordhead().
#
# All output goes through single-argument print(...) calls so the script runs
# unchanged on Python 2.6+ and Python 3.

import struct

true = True
false = False

skip_deleted = false    # set to true to leave deleted records out of the XML
try_recover = false     # set to true to try to interpret deleted records

Standardlength = 22     # size in bytes of the standard file header
ourfiletype = 'OPLDatabaseFile'
Stheader = {}           # filled in by checkheader()

# Record type names, indexed by the 4-bit type code of a record header.
recordtypes = [
    'deleted', 'mergable1', 'field_information', 'descriptive',
    'private4', 'private5', 'private6', 'private7',
    'mergable8', 'mergable9', 'mergable10', 'mergable11',
    'mergable12', 'mergable13', 'mergable_voice', 'reserved4sys']
record = {}             # 'type' and 'length' of the current record
subrecord = {}          # 'type' and 'length' of the current subrecord

# Field type names, indexed by the type byte in the field information record.
fieldtypes = ['word', 'long', 'real', 'qstr']
field = ['zero']        # field[0] exists so that field numbers start at 1

# struct formats of the fixed-size field types.
# NOTE(review): assumes word = signed 16 bit, long = signed 32 bit and
# real = 8 byte IEEE double, all little-endian -- confirm against the
# psionic file format description.
_FIXED_FIELD_FORMATS = {'word': '<h', 'long': '<l', 'real': '<d'}


def _byte_values(buf):
    """Return the bytes of *buf* as a list of integers (0..255).

    Accepts byte strings (Python 2 str, Python 3 bytes/bytearray) as well as
    text strings, so callers do not depend on what indexing a buffer yields.
    """
    if isinstance(buf, (bytes, bytearray)):
        return list(bytearray(buf))
    return [ord(ch) for ch in buf]


def _split_tal(buf):
    """Split a two byte record/subrecord header into (type code, length).

    NOTE(review): reconstructed.  Assumes a little-endian word whose low
    12 bits are the data length and whose top 4 bits are the type code.
    """
    low, high = struct.unpack("<BB", buf)
    return high >> 4, ((high & 0x0F) << 8) | low


def checkheader(header):
    """Check the file header and store its fields in Stheader.

    Returns 'Okay' when *header* is a complete standard header of an OPL
    database file, otherwise None (wrong file type, or fewer than
    Standardlength bytes were available).
    """
    if len(header) != Standardlength:
        return None     # short read: struct.unpack would raise on this
    name, crea_ver, length, use_ver = struct.unpack("<16shhh", header)
    name = name[0:15].decode('latin-1')     # get rid of the trailing null
    if name != ourfiletype:
        return None     # not our file type
    Stheader['name'] = ourfiletype
    Stheader['creator'] = crea_ver
    Stheader['length'] = length
    Stheader['user'] = use_ver
    return 'Okay'


def getrecordtal(buf):
    """Get record type and length, result is in dict 'record'.

    record['type'] becomes a name from recordtypes, record['length'] the
    number of data bytes that follow the two byte header *buf*.
    """
    code, length = _split_tal(buf)
    record['type'] = recordtypes[code]
    record['length'] = length


def getsubrecordtal(buf):
    """Get subrecord type and length, result is in dict 'subrecord'.

    subrecord['type'] is the numeric type code, subrecord['length'] the
    number of data bytes that follow the two byte header *buf*.
    """
    code, length = _split_tal(buf)
    subrecord['type'] = code
    subrecord['length'] = length


def printxmlrecordhead():
    """Print the XML start tag of the current record."""
    print(" <record type='" + record['type'] +
          "' length='" + repr(record['length']) + "'>")


def printxmlrecordtail():
    """Print the XML end tag of the current record."""
    print(" </record>")


def printxmlfield(fn, str):
    """Print field number *fn* with the already escaped content *str*."""
    print(" <field nr='" + repr(fn) + "'>" + str + "</field>")


def printhexvalue(buf):
    """Print *buf* as hexadecimal byte values, twelve bytes per line."""
    print(" <hexvalue>")
    values = _byte_values(buf)
    for start in range(0, len(values), 12):
        print(" " + "".join([" " + hex(v) for v in values[start:start + 12]]))
    print(" </hexvalue>")


def cleandata(buf):
    """Return *buf* as text that is safe to place inside an XML element.

    Plain printable characters are copied, byte 5 becomes "<phone/>",
    byte 21 (octal 025) becomes "<lf/>" and every other byte, including
    the XML special characters, becomes a numeric character reference.
    """
    pieces = []
    for value in _byte_values(buf):
        if (ord(' ') <= value <= ord('%')
                or ord('(') <= value <= ord(';')
                or ord('@') <= value <= ord('z')):
            pieces.append(chr(value))
        elif value == 0o05:
            pieces.append("<phone/>")
        elif value == 0o25:
            pieces.append("<lf/>")
        else:
            pieces.append("&#" + repr(value) + ";")
    return "".join(pieces)


def processfield_inforecord(buf):
    """Register the field types listed in a field information record.

    Each byte of *buf* is the type code of one field.  The type names are
    appended to the global 'field' list; codes outside fieldtypes are
    registered as 'unknown' instead of raising IndexError.
    """
    for code in _byte_values(buf)[:record['length']]:
        if code < len(fieldtypes):
            typename = fieldtypes[code]
        else:
            typename = 'unknown'
        field.append(typename)
        print(" <fieldinfo nr='" + repr(len(field) - 1) + "'>" +
              typename + "</fieldinfo>")


def proc_desc_subrec_label(buf):
    """Print the field labels stored in a label subrecord (type 4).

    The labels are length-prefixed strings; an empty label is printed as
    "blank" followed by its field number.
    """
    values = _byte_values(buf)
    limit = min(subrecord['length'], len(values))
    name = "label"      # one fixed element name: easier xpath finding label
    pos = 0
    fn = 1              # first field number
    while pos < limit:
        size = values[pos]
        pos = pos + 1
        if size > 0:
            label = cleandata(buf[pos:pos + size])
        else:
            label = "blank" + repr(fn)
        print(" <" + name + ">" + label + "</" + name + ">")
        pos = pos + size
        fn = fn + 1


def proc_desc_subrec_pd(buf):
    """Print a type 7 subrecord: one byte followed by a terminated string.

    NOTE(review): presumably the printer driver model and library name;
    the element names are reconstructed.
    """
    if not buf:
        return          # empty subrecord, nothing to report
    print(" <model>" + repr(_byte_values(buf[0:1])[0]) + "</model>")
    # Escaped like every other string so the output stays well-formed XML.
    print(" <driver>" + cleandata(buf[1:-1]) + "</driver>")


def proc_desc_subrec_hf(hf, cstr):
    """Print a header or footer subrecord; *hf* is the element name."""
    print(" <" + hf + " str='C'>" + cleandata(cstr[:-1]) + "</" + hf + ">")


def processdescriptivesubrecord(buf):
    """Print one subrecord of a descriptive record.

    Types 4, 7, 8 and 9 are interpreted, all others are dumped as hex.
    """
    print(" <subrecord type='" + repr(subrecord['type']) +
          "' length='" + repr(subrecord['length']) + "'>")
    if subrecord['type'] == 4:
        proc_desc_subrec_label(buf)
    elif subrecord['type'] == 7:
        proc_desc_subrec_pd(buf)
    elif subrecord['type'] == 8:
        proc_desc_subrec_hf("header", buf)
    elif subrecord['type'] == 9:
        proc_desc_subrec_hf("footer", buf)
    else:
        printhexvalue(buf)
    print(" </subrecord>")


def processdescriptiverecord(buf):
    """Walk through the subrecords of a descriptive record and print them."""
    limit = min(record['length'], len(buf))
    pos = 0
    # A subrecord header needs two bytes; a stray trailing byte is ignored.
    while pos + 2 <= limit:
        getsubrecordtal(buf[pos:pos + 2])
        pos = pos + 2
        processdescriptivesubrecord(buf[pos:pos + subrecord['length']])
        pos = pos + subrecord['length']


def processdeletedrecord(buf):
    """Print a deleted record.

    Without try_recover the data is dumped as hex.  With try_recover a
    record starting with the bytes 0x02 0x10 is read as a descriptive
    record, anything else as a data record.
    """
    if not try_recover:
        printhexvalue(buf)
        return
    if _byte_values(buf[0:2]) == [0o002, 0o020]:
        print(" <!-- deleted record, recovered as descriptive record -->")
        processdescriptiverecord(buf)
    else:
        print(" <!-- deleted record, recovered as data record -->")
        processotherrecords(buf)


def processotherrecords(buf):
    """Print the fields of a data record.

    The field types come from the global 'field' list.  'qstr' fields are
    length-prefixed strings; fixed-size fields are decoded and skipped by
    their size so the fields that follow are read from the right offset.
    Data that cannot be matched to a known field is dumped as hex.
    """
    limit = min(record['length'], len(buf))
    pos = 0             # at the begin of "buf"
    fn = 1              # the first field number
    while pos < limit:
        typename = None
        if fn < len(field):
            typename = field[fn]
        fmt = _FIXED_FIELD_FORMATS.get(typename)
        if typename == 'qstr':
            size = _byte_values(buf[pos:pos + 1])[0]
            pos = pos + 1           # next position in buffer
            printxmlfield(fn, cleandata(buf[pos:pos + size]))
            pos = pos + size
        elif fmt is not None and pos + struct.calcsize(fmt) <= limit:
            size = struct.calcsize(fmt)
            value = struct.unpack(fmt, buf[pos:pos + size])[0]
            printxmlfield(fn, repr(value))
            pos = pos + size
        else:
            # Unknown field type, more data than fields, or a truncated
            # value: show the rest instead of guessing.
            printhexvalue(buf[pos:limit])
            break
        fn = fn + 1


def processrecord(buf):
    """Print one record, dispatching on record['type']."""
    printxmlrecordhead()
    if record['type'] == 'field_information':
        processfield_inforecord(buf)
    elif record['type'] == 'descriptive':
        processdescriptiverecord(buf)
    elif record['type'] == 'deleted':
        processdeletedrecord(buf)
    else:
        processotherrecords(buf)
    printxmlrecordtail()


def printxmlhead():
    """Print the XML declaration, the root start tag and the file header."""
    print('<?xml version="1.0"?>')
    print("<" + ourfiletype + ">")
    print("<header>")
    print(" <standard>")
    print(" <name>" + Stheader['name'] + "</name>")
    print(" <creator>" + hex(Stheader['creator']) + "</creator>")
    print(" <length>" + repr(Stheader['length']) + "</length>")
    print(" <user>" + hex(Stheader['user']) + "</user>")
    print(" </standard>")
    print(" <extended>")    # there should come more code
    print(" </extended>")
    print("</header>")
    print("<records>")


def printxmltail():
    """Print the end tags that close what printxmlhead() opened."""
    print("</records>")
    print("</" + ourfiletype + ">")


def s3data2xml(file):
    """Read *file* and, if it is an OPL database file, print it as XML.

    *file* must be a binary file object.  read() signals end of file with
    a short (possibly empty) result rather than an exception, so every
    read is checked by length; a truncated file ends the record list with
    an XML comment instead of a traceback.
    """
    buf = file.read(Standardlength)
    if checkheader(buf) != 'Okay':
        print("Error: not our file type")
        return
    del field[1:]       # forget field types of a previously converted file
    printxmlhead()
    while True:
        buf = file.read(2)
        if len(buf) < 2:
            if len(buf) == 1:
                print(" <!-- unexpected end of file in record header -->")
            break
        getrecordtal(buf)
        buf = file.read(record['length'])
        if len(buf) < record['length']:
            print(" <!-- unexpected end of file in record data -->")
            break
        if record['type'] == 'deleted' and skip_deleted:
            print(" <!-- deleted record skipped -->")
        else:
            processrecord(buf)
    printxmltail()


if __name__ == '__main__':
    import sys
    if len(sys.argv) == 1:
        # Python 3 exposes the binary stream as sys.stdin.buffer.
        s3data2xml(getattr(sys.stdin, 'buffer', sys.stdin))
    else:
        with open(sys.argv[1], "rb") as datafile:
            s3data2xml(datafile)

# end of script