wojood-api / XML_to_HTML.py
TymaaHammouda's picture
Update ner service
cfe897e
import re
# Opening-tag name -> (CSS class suffix, value of the data-entity attribute).
# The two are listed separately because they differ for some labels:
# GROUP is exposed as NORP and CURR as CURRENCY. WORK_OF_ART is accepted with
# or without underscores in the tag name.
_NER_SPAN_ATTRS = {
    'PERS': ('pers', 'PERS'),
    'GROUP': ('group', 'NORP'),
    'OCC': ('occ', 'OCC'),
    'ORG': ('org', 'ORG'),
    'LOC': ('loc', 'LOC'),
    'GPE': ('gpe', 'GPE'),
    'FAC': ('fac', 'FAC'),
    'EVENT': ('event', 'EVENT'),
    'DATE': ('date', 'DATE'),
    'TIME': ('time', 'TIME'),
    'CARDINAL': ('cardinal', 'CARDINAL'),
    'ORDINAL': ('ordinal', 'ORDINAL'),
    'PERCENT': ('percent', 'PERCENT'),
    'QUANTITY': ('quantity', 'QUANTITY'),
    'UNIT': ('unit', 'UNIT'),
    'MONEY': ('money', 'MONEY'),
    'CURR': ('currency', 'CURRENCY'),
    'LANGUAGE': ('language', 'LANGUAGE'),
    'PRODUCT': ('product', 'PRODUCT'),
    'WORKOFART': ('work_of_art', 'WORK_OF_ART'),
    'WORK_OF_ART': ('work_of_art', 'WORK_OF_ART'),
    'LAW': ('law', 'LAW'),
}

# Matches an opening or closing tag whose name is either the literal
# WORK_OF_ART or a run of upper-case ASCII letters. Group 1 is "/" for a
# closing tag and empty for an opening tag; group 2 is the tag name.
_NER_TAG_RE = re.compile(r'<(/?)(WORK_OF_ART|[A-Z]+)>')


def NER_XML_to_HTML(xml):
    """Convert NER entity tags in *xml* into HTML ``<span>`` elements.

    Every closing tag of the form ``</NAME>`` (upper-case letters, or
    ``WORK_OF_ART``) becomes ``</span>``. Every recognised opening tag
    ``<NAME>`` becomes ``<span class="ner_..." data-entity="...">``.
    Opening tags with an unrecognised name are left unchanged.

    Only the tags themselves are rewritten; the text between them is passed
    through untouched. In particular, a literal ``WORK_OF_ART`` occurring in
    the text is no longer altered.

    Args:
        xml: String containing the tagged text.

    Returns:
        The string with entity tags replaced by span markup.

    Note:
        No HTML escaping is performed on the surrounding text.
        NOTE(review): if *xml* can contain untrusted text, confirm it is
        escaped before or after this call.
    """
    def _to_span(match):
        closing, name = match.groups()
        if closing:
            # Any upper-case closing tag maps to the same end-span tag.
            return '</span>'
        attrs = _NER_SPAN_ATTRS.get(name)
        if attrs is None:
            # Unknown entity label: keep the opening tag as it was.
            return match.group(0)
        return '<span class="ner_%s" data-entity="%s">' % attrs

    # A callable replacement is used so the result is inserted literally,
    # with no backslash/group-reference processing.
    return _NER_TAG_RE.sub(_to_span, xml)