Fixed a bug in the RFC Index parsing that caused extraction of only one paragraph of an abstract, even if there were multiple.
- Legacy-Id: 15820
This commit is contained in:
parent
fbcdcfaf0d
commit
75b0f0dacc
|
@@ -28,10 +28,11 @@ MIN_QUEUE_RESULTS = 10
|
|||
MIN_INDEX_RESULTS = 5000
|
||||
|
||||
def get_child_text(parent_node, tag_name):
    """Return the text of every direct child element named *tag_name*.

    Each matching child contributes the data of its first child node, and
    the pieces are joined with a blank line between them.  This lets a
    value that is split over several sibling elements (for example an
    abstract made of multiple paragraphs) be returned in full instead of
    only its first paragraph.

    Args:
        parent_node: DOM node whose ``childNodes`` are scanned.
        tag_name: Local name of the child elements to collect.

    Returns:
        The collected text joined with ``'\\n\\n'``; an empty string when
        no child element matches.
    """
    text = []
    for node in parent_node.childNodes:
        if node.nodeType == Node.ELEMENT_NODE and node.localName == tag_name:
            first = node.firstChild
            # An empty element (<tag/>) has no first child; skip it rather
            # than fail with AttributeError on ``None.data``.
            if first is not None:
                text.append(first.data)
    return '\n\n'.join(text)
|
||||
|
||||
|
||||
def fetch_queue_xml(url):
|
||||
|
|
Loading…
Reference in a new issue