Spaces:
Sleeping
Sleeping
| import re | |
# Maps each recognised NER tag name to the (CSS class, data-entity value)
# used for its <span>. Note that GROUP is emitted as data-entity "NORP" and
# CURR as "CURRENCY". WORKOFART is kept as an alias of WORK_OF_ART so input
# that already uses the underscore-free spelling is still converted.
_NER_SPAN_ATTRS = {
    'PERS': ('ner_pers', 'PERS'),
    'GROUP': ('ner_group', 'NORP'),
    'OCC': ('ner_occ', 'OCC'),
    'ORG': ('ner_org', 'ORG'),
    'LOC': ('ner_loc', 'LOC'),
    'GPE': ('ner_gpe', 'GPE'),
    'FAC': ('ner_fac', 'FAC'),
    'EVENT': ('ner_event', 'EVENT'),
    'DATE': ('ner_date', 'DATE'),
    'TIME': ('ner_time', 'TIME'),
    'CARDINAL': ('ner_cardinal', 'CARDINAL'),
    'ORDINAL': ('ner_ordinal', 'ORDINAL'),
    'PERCENT': ('ner_percent', 'PERCENT'),
    'QUANTITY': ('ner_quantity', 'QUANTITY'),
    'UNIT': ('ner_unit', 'UNIT'),
    'MONEY': ('ner_money', 'MONEY'),
    'CURR': ('ner_currency', 'CURRENCY'),
    'LANGUAGE': ('ner_language', 'LANGUAGE'),
    'PRODUCT': ('ner_product', 'PRODUCT'),
    'WORK_OF_ART': ('ner_work_of_art', 'WORK_OF_ART'),
    'WORKOFART': ('ner_work_of_art', 'WORK_OF_ART'),
    'LAW': ('ner_law', 'LAW'),
}

# Matches an opening or closing tag of any recognised entity type.
# Group 1 is "/" for a closing tag (empty otherwise); group 2 is the tag name.
_NER_TAG_RE = re.compile(r'<(/?)(' + '|'.join(_NER_SPAN_ATTRS) + r')>')


def NER_XML_to_HTML(xml):
    """Convert NER entity tags in *xml* into HTML ``<span>`` elements.

    Every recognised opening tag (e.g. ``<PERS>``) becomes
    ``<span class="ner_..." data-entity="...">`` and its closing tag becomes
    ``</span>``. The conversion is done in a single pass over the input.

    Only tags themselves are rewritten: text between tags is left untouched
    (including text that happens to contain a tag name such as
    ``WORK_OF_ART``), and tags that are not in the recognised set are passed
    through unchanged so their opening and closing tags stay balanced.

    Args:
        xml: String containing entity tags such as ``<PERS>...</PERS>``.

    Returns:
        The input string with recognised entity tags replaced by spans.
    """
    def _to_span(match):
        # A leading "/" means this is a closing tag.
        if match.group(1):
            return '</span>'
        css_class, entity = _NER_SPAN_ATTRS[match.group(2)]
        return '<span class="%s" data-entity="%s">' % (css_class, entity)

    return _NER_TAG_RE.sub(_to_span, xml)