examples/benchmarks.py
author robin
Fri, 23 Dec 2016 12:55:22 +0000
changeset 56 51219ad2b0bd
parent 53 3a3f172a62bf
permissions -rw-r--r--
speed up windows 3.6 build
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     1
# benchmark
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     2
# MSXML:  This can be downloaded from many places.  You need 3.0
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     3
# which is NOT in most newly installed Windows boxes. (650kb)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     4
# http://download.microsoft.com/download/xml/Install/3.0/WIN98Me/EN-US/msxml3.exe
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     5
#    for a quick tutorial on MSXML 3.0, see
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     6
# http://www.perfectxml.com/articles/xml/msxml30.asp
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     7
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     8
# you should then run the COM MakePY utility on the Pythonwin menu.
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
     9
# to get it going as fast as possible.
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    10
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    11
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    12
import sys
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    13
import glob
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    14
import time
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    15
import string
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    16
from types import TupleType
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    17
import cStringIO
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    18
    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    19
def tupleTreeStats(node):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    20
    # counts tags and attributes recursively
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    21
    # use for all reportlab parsers
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    22
    if node[1] is None:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    23
        attrCount = 0
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    24
    else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    25
        attrCount = len(node[1])
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    26
    nodeCount = 1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    27
    if node[2] is not None:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    28
        for child in node[2]:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    29
            if type(child) is TupleType:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    30
                a, n = tupleTreeStats(child)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    31
                attrCount = attrCount + a
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    32
                nodeCount = nodeCount + n
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    33
    return attrCount, nodeCount
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    34
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    35
###  pyRXP - our wrapper around Univ of Edinburgh
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    36
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    37
def getPyRXPParser():
53
3a3f172a62bf benchmarks.py: import pyRXPU rather than pyRXP
Matthew Pitkin <pitkin@gmail.com>
parents: 11
diff changeset
    38
    import pyRXPU
3a3f172a62bf benchmarks.py: import pyRXPU rather than pyRXP
Matthew Pitkin <pitkin@gmail.com>
parents: 11
diff changeset
    39
    p = pyRXPU.Parser()
1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    40
    return p
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    41
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    42
def getNonValidatingPyRXPParser():
53
3a3f172a62bf benchmarks.py: import pyRXPU rather than pyRXP
Matthew Pitkin <pitkin@gmail.com>
parents: 11
diff changeset
    43
    import pyRXPU
3a3f172a62bf benchmarks.py: import pyRXPU rather than pyRXP
Matthew Pitkin <pitkin@gmail.com>
parents: 11
diff changeset
    44
    p = pyRXPU.Parser(Validate=0)
1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    45
    return p
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    46
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    47
def parseWithPyRXP(parser, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    48
    return parser.parse(rawdata)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    49
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    50
###  rparsexml - Aaron's very fast pure python parser
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    51
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    52
def loadRparseXML():
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    53
    #it's a module, what the heck
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    54
    from reportlab.lib import rparsexml
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    55
    return rparsexml
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    56
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    57
def parseWithRParseXML(rparsexml, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    58
    #first argument is a dummy holding none
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    59
    return rparsexml.parsexml0(rawdata)[0] 
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    60
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    61
###  expattree - tree-building wrapper around pyexpat
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    62
def getExpatParser():
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    63
    import expattree
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    64
    return expattree.ExpatTreeParser()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    65
    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    66
def parseWithExpat(expatParser, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    67
    #first argument is a dummy holding none
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    68
    return expatParser.parse(rawdata)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    69
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    70
####### minidom - non-validating DOM parser in the Python distro
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    71
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    72
def loadMiniDOM():
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    73
    import xml.dom.minidom
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    74
    return xml.dom.minidom
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    75
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    76
def parseWithMiniDOM(dom_module, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    77
    #parser is None
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    78
    return dom_module.parseString(rawdata)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    79
    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    80
def statsWithMiniDOM(node):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    81
    return (1, 0)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    82
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    83
#########  Microsoft XML Parser via COM ######################
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    84
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    85
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    86
def loadMSXML30():
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    87
    from win32com.client import Dispatch
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    88
    msx = Dispatch('Microsoft.XMLDOM')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    89
    return msx
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    90
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    91
def parseWithMSXML30(msx, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    92
    msx.loadXML(rawdata)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    93
    return msx
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    94
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    95
def statsWithMSXML30(node):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    96
    #not done
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    97
    return (1,0)    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    98
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
    99
###########4DOM ###############
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   100
def load4DOM():
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   101
    from xml.dom.ext.reader import PyExpat
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   102
    from xml.dom import Node
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   103
    reader = PyExpat.Reader()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   104
    return reader
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   105
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   106
def parseWith4DOM(reader, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   107
    return reader.fromString(rawdata)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   108
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   109
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   110
def statsWith4DOM(node):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   111
    #node
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   112
    return (1,0)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   113
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   114
def loadCDomlette():
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   115
    from Ft.Lib import cDomlettec
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   116
    return cDomlettec
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   117
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   118
def parseWithCDomlette(modul, rawdata):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   119
    io = cStringIO.StringIO(rawdata)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   120
    return modul.parse(io, '')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   121
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   122
def statsWithCDomlette(node):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   123
    #node
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   124
    return (1,0)
10
c4180c9ff648 added .hgeol .hgignore
rptlab
parents: 2
diff changeset
   125
1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   126
##########put them all together################
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   127
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   128
TESTMAP = [
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   129
    # name of parser; function to initialize if needed;
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   130
    # function to parse; function to do stats
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   131
    ('pyRXP', getPyRXPParser, parseWithPyRXP, tupleTreeStats),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   132
    ('pyRXP_nonvalidating', getNonValidatingPyRXPParser, parseWithPyRXP, tupleTreeStats),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   133
    ('rparsexml', loadRparseXML, parseWithRParseXML, tupleTreeStats),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   134
    ('expat', getExpatParser, parseWithExpat, tupleTreeStats),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   135
    ('minidom', loadMiniDOM, parseWithMiniDOM, statsWithMiniDOM),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   136
    ('msxml30', loadMSXML30, parseWithMSXML30, statsWithMSXML30),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   137
    ('4dom', load4DOM, parseWith4DOM, statsWith4DOM),
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   138
    ('cdomlette', loadCDomlette, parseWithCDomlette, statsWithCDomlette)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   139
    ]    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   140
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   141
def interact(testName=None, dtd=1, pause='unknown'):
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   142
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   143
    # if no DTD requested, trim off first 2 lines; the lack of
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   144
    # a DTD reference will put validating parsers into non-
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   145
    # validating mode
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   146
    if dtd:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   147
        sampleText = open('rml_a.xml').read()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   148
    else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   149
        print 'DTD declaration removed, non-validating'
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   150
        lines = open('rml_a.xml').readlines()[2:]
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   151
        sampleText = string.join(lines,'')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   152
        
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   153
    if testName:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   154
        found = 0
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   155
        for row in TESTMAP:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   156
            if row[0] == testName:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   157
                found = 1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   158
                (name, loadFunc, parseFunc, statFunc) = row
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   159
                break
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   160
        if not found:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   161
            print 'parser %s not found, please select' % testName
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   162
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   163
    if not testName:            
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   164
    # interactive, show stuff
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   165
        print "Interactive benchmark suite for Python XML tree-parsers."
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   166
        print 'Using sample XML file %d bytes long' % len(sampleText)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   167
        print "Parsers available:"
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   168
        i = 1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   169
        for (name, a, b, c) in TESTMAP:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   170
            print '\t%d.  %s' % (i, name)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   171
            i = i + 1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   172
        print
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   173
        inp = raw_input('Parser number (or x to exit) > ')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   174
        if inp == 'x':
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   175
            print 'bye'
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   176
            return
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   177
        else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   178
            num = int(inp)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   179
            (name, loadFunc, parseFunc, statFunc) = TESTMAP[num-1]
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   180
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   181
    # force pause to 1 or 0 by asking
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   182
    if pause == 'unknown': 
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   183
        inp = raw_input("Shall we do memory tests?  i.e. you look at Task Manager? y/n > ")
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   184
        assert inp in 'yn', 'enter "y" or "n".  Please run again!'
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   185
        pause = (inp == 'y')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   186
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   187
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   188
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   189
    print 'testing %s' % testName
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   190
    #load the parser
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   191
    t0 = time.clock()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   192
    parser = loadFunc()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   193
    loadTime = time.clock() - t0
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   194
    if pause:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   195
        baseMem = float(raw_input("Pre-parsing: please input python process memory in kb > "))
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   196
    t1 = time.clock()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   197
    parsedOutput = parseFunc(parser, sampleText)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   198
    t2 = time.clock()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   199
    parseTime = t2 - t1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   200
    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   201
    if pause:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   202
        totalMem = float(raw_input('Post-parsing: please input python process memory in kb > '))
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   203
        usedMem = totalMem - baseMem
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   204
        memFactor = usedMem * 1024.0 / len(sampleText)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   205
    t3 = time.clock()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   206
    n, a = statFunc(parsedOutput)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   207
    t4 = time.clock()
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   208
    traverseTime = t4 - t3
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   209
    print 'counted %d tags, %d attributes' % (n, a)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   210
    if pause:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   211
        print '%s: init %0.4f, parse %0.4f, traverse %0.4f, mem used %dkb, mem factor %0.2f' % (
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   212
            name, loadTime, parseTime, traverseTime, usedMem, memFactor)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   213
    else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   214
        print '%s: init %0.4f, parse %0.4f, traverse %0.4f' % (
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   215
            name, loadTime, parseTime, traverseTime)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   216
    print
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   217
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   218
    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   219
if __name__=='__main__':
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   220
    import sys
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   221
    args = sys.argv[:]
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   222
    if '-nodtd' in args:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   223
        dtd=0
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   224
        args.remove('-nodtd')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   225
    else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   226
        dtd=1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   227
        
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   228
    if '-pause' in args:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   229
        pause = 1
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   230
        args.remove('-pause')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   231
    elif '-nopause' in args:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   232
        pause = 0
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   233
        args.remove('-nopause')
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   234
    else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   235
        pause = 'unknown'  # it will ask
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   236
    if len(args) > 1:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   237
        testName = args[1]
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   238
    else:
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   239
        testName = None
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   240
    interact(testName, dtd, pause=pause)
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   241
    
7cf042be50ba Move pyRXP into its own universe
rgbecker
parents:
diff changeset
   242