/usr/share/w3af/extlib/nltk/olac.py is in w3af-console 1.0-rc3svn3489-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
# Natural Language Toolkit: Support for OLAC Metadata
#
# Copyright (C) 2001-2009 NLTK Project
# Author: Steven Bird <sb@csse.unimelb.edu.au>
# URL: <http://www.nltk.org/>
# For license information, see LICENSE.TXT
from StringIO import StringIO
def read_olac(xml):
    """
    Read an OLAC XML record and return a list of attributes.

    Each direct child of the record's root element contributes one
    C{(tag, attrib, text)} tuple, in document order.

    @param xml: XML string for conversion
    @type xml: C{string}
    @return: one C{(tag, attrib, text)} tuple per child of the root
        element; C{text} is C{None} for a child without text content
    @rtype: C{list} of C{tuple}
    """
    try:
        from lxml import etree
    except ImportError:
        # lxml is optional: the standard library's ElementTree provides the
        # same parse()/getroot()/tag/attrib/text API that is used below.
        from xml.etree import ElementTree as etree
    root = etree.parse(StringIO(xml)).getroot()
    # Iterate over the element itself rather than calling getchildren(),
    # which lxml deprecates and newer ElementTree releases no longer have.
    return [(child.tag, child.attrib, child.text) for child in root]
def pprint_olac(xml):
    """
    Pretty-print an OLAC XML record, one line per child element.

    Every line starts with the element tag left-justified in a 12-character
    column and followed by a colon.  The element text is appended when it
    is non-empty, and a C{(type=code)} annotation is appended when the
    element carries both a C{type} and a C{code} attribute.  Fields are
    separated by single spaces.

    @param xml: XML string for conversion
    @type xml: C{string}
    """
    import sys
    for tag, attrib, text in read_olac(xml):
        fields = ["%-12s" % tag + ':']
        if text:
            fields.append(text)
        # Elements may carry attributes other than type/code; only build
        # the annotation when both keys exist instead of raising KeyError.
        if 'type' in attrib and 'code' in attrib:
            fields.append("(%s=%s)" % (attrib['type'], attrib['code']))
        # Emit the whole line at once so the spacing does not depend on
        # the print statement's soft-space bookkeeping.
        sys.stdout.write(' '.join(fields) + '\n')
def demo():
    """
    Pretty-print the OLAC record found at C{corpora/treebank/olac.xml}
    in the NLTK data directories.
    """
    import nltk.data
    path = nltk.data.find('corpora/treebank/olac.xml')
    # Close the file explicitly instead of leaving it to garbage
    # collection; try/finally keeps this valid on old interpreters too.
    handle = open(path)
    try:
        xml = handle.read()
    finally:
        handle.close()
    pprint_olac(xml)
# Names exported by "from <module> import *"; demo() is not listed.
__all__ = ['read_olac', 'pprint_olac']

# Run the demonstration when this file is executed as a script.
if __name__ == '__main__':
    demo()
|