"""Convert a search-result XML file into a JSON document of clips.

Every ``<doc>`` element found in the input becomes one entry of the
``"clips"`` list in the output.  The resulting JSON is written to stdout.

Provenance: added as ``parse_search-xml.py`` in commit 4e0a34a
("Renamed Parse-Search", Gabriel Dunne, 2013-03-22).
"""
import json
import xml.etree.ElementTree as ET

# Input file read when the script is run without further configuration.
SOURCE_XML = 'search-lg.xml'

# Maps the ``name`` attribute of a <str> element to the key it is stored
# under in the clip dictionary.
_STR_FIELDS = {
    "identifier": "id",
    "description": "description",
    "title": "title",
}


def _clip_from_doc(doc):
    """Build one clip dictionary from a single ``<doc>`` element.

    Only fields that are actually present in *doc* appear in the result.
    When a field occurs more than once, the last occurrence wins.
    """
    clip = {}

    # iter() walks all descendants, so unnamed <str> children of <arr>
    # elements are visited too; they simply do not match any known field.
    for elem in doc.iter('str'):
        key = _STR_FIELDS.get(elem.get('name'))
        if key is not None:
            clip[key] = elem.text

    for elem in doc.iter('date'):
        if elem.get('name') == "publicdate":
            clip["date"] = elem.text

    for elem in doc.iter('arr'):
        if elem.get('name') == "subject":
            clip["subject"] = [item.text for item in elem.iter('str')]

    return clip


def parse_clips(root):
    """Return ``{"clips": [...]}`` with one entry per ``<doc>`` under *root*.

    Args:
        root: an ``xml.etree.ElementTree.Element`` to search (the element
            itself is included in the search, as with ``Element.iter``).

    Returns:
        A dict with a single ``"clips"`` key holding a list of clip dicts.
        Each clip may contain ``id``, ``description``, ``title``, ``date``
        and ``subject`` (a list of strings), depending on what the
        corresponding ``<doc>`` provides.
    """
    return {"clips": [_clip_from_doc(doc) for doc in root.iter('doc')]}


def main(path=SOURCE_XML):
    """Parse the XML file at *path* and print the clips as JSON."""
    root = ET.parse(path).getroot()
    # Parenthesised call form works as a function on Python 3 and as a
    # print statement with a parenthesised expression on Python 2.
    print(json.dumps(parse_clips(root)))


if __name__ == "__main__":
    main()