summary | refs | log | tree | commit | diff
path: root/readers/xml_reader.py
diff options
context:
space:
mode:
author: roy lewin <roy.lewin@gmail.com> 2016-09-25 19:15:46 +0300
committer: roy lewin <tzafrir@cohens.org.il> 2016-09-25 19:16:48 +0300
commit: 41125eb195324d18d9c2c12aa12ecbf66dc5d495 (patch)
tree: 82fbe719ef68f366b5f603487054b8f3f8fefd23 /readers/xml_reader.py
parent: a59d8c977eac3eb5c71870815730e4c9bf35bad2 (diff)
WIP: merge changes not previously merged
(Commit done by Tzafrir)
Diffstat (limited to 'readers/xml_reader.py')
-rw-r--r-- readers/xml_reader.py 17
1 file changed, 10 insertions, 7 deletions
diff --git a/readers/xml_reader.py b/readers/xml_reader.py
index af80e25..5b2d1fd 100644
--- a/readers/xml_reader.py
+++ b/readers/xml_reader.py
@@ -20,13 +20,13 @@ def read_file(path, element_key):
# get the root element
event, root = context.__next__()
- #the factory
+ # the factory
inl_factory = factories.INLFactory()
files = {}
for event, element in context:
if 'end' in event:
if element_key in element.tag:
- #enter the processing here
+ # enter the processing here
record_counter += 1
#cleaned element is a tree
@@ -34,7 +34,7 @@ def read_file(path, element_key):
cleaned_element = inl_parser.clearxml()
entity = inl_factory.get_entity(cleaned_element)
- #test print the entity
+ # test print the entity
if entity != None:
if entity.TYPE not in files:
files[entity.TYPE] = open("../out/{}.csv".format(entity.TYPE), 'w+', encoding='utf8')
@@ -47,12 +47,15 @@ def read_file(path, element_key):
# entity.print_entity()
-
- #TODO analys and upload the entity
+ # TODO analys and upload the entity
# import pdb; pdb.set_trace()
- #print(record_counter, cleaned_element.getroot().tag, '@@@', cleaned_element.getroot().attrib, '@@@', cleaned_element.getroot().text)
+ print(record_counter, cleaned_element.getroot().tag, '@@@', cleaned_element.getroot().attrib, '@@@',
+ cleaned_element.getroot().text)
element.clear()
+ print(record_counter)
+
+
if __name__ == '__main__':
- read_file(r"C:/Users/Ilsar/Documents/datahack/NLI-nnl10.xml", 'record')
+ read_file(r"../../NLI-nnl10.xml", 'record')