Files
roauthorship/src/ttl/ttlservice.py
2017-05-23 13:57:53 +03:00

35 lines
1.2 KiB
Python

# coding: utf-8
import zeep
# Substitutions applied to the caller's text before it is sent to the service:
# these accented letters are flattened to their plain ASCII base letter.
_TTL_INPUT_REPLACEMENTS = (
    (u'ĭ', u'i'),
    (u'ŭ', u'u'),
    (u'à', u'a'),
)

# Substitutions applied, in this order, to the text returned by the service.
# Every literal is unicode on purpose: on Python 2 a plain '...' literal holding
# non-ASCII characters is a UTF-8 byte string, and using it with .replace() on a
# unicode result triggers an implicit ASCII decode (UnicodeDecodeError).
#
# NOTE(review): several pairs replace a character with itself. The search
# strings may originally have been SGML entity names that were decoded somewhere
# along the way -- confirm against the raw service output. The pairs are kept
# as-is so the current behaviour does not change.
_TTL_OUTPUT_REPLACEMENTS = (
    (u'’', u'`'),
    (u'ă', u'ă'),
    (u'à', u'à'),
    (u'â', u'â'),
    (u'î', u'î'),
    (u'ş', u'ș'),  # cedilla form -> comma-below form
    (u'ţ', u'ț'),  # cedilla form -> comma-below form
    (u'ŭ', u'u'),
    (u'Ă', u'Ă'),
    (u'À', u'À'),
    (u'Â', u'Â'),
    (u'Î', u'Î'),
    (u'Ş', u'Ș'),  # cedilla form -> comma-below form
    (u'Ţ', u'Ț'),  # cedilla form -> comma-below form
    (u'Ŭ', u'U'),
)


def _replace_all(value, replacements):
    """Apply each (old, new) substitution to value, in order, and return it."""
    for old, new in replacements:
        value = value.replace(old, new)
    return value


def executeTtl(text):
    """Run text through the remote TTL SOAP service and wrap the reply in XML.

    The text is first normalised (a few accented letters are flattened to
    ASCII), then passed to the service's ``UTF8toSGML`` operation, and the
    outcome of that is passed to its ``XCES`` operation together with the
    arguments ``"ro"`` and ``"id"`` (presumably a language code and an
    identifier -- verify against the service's WSDL). The reply is cleaned
    up character by character and returned inside a ``<segs>`` root element
    preceded by an XML declaration.

    A new ``zeep.Client`` is created on every call, so each call loads the
    WSDL again. Errors raised by zeep or the network are not caught here and
    propagate to the caller.

    :param text: the text to analyse (unicode).
    :return: a string holding the XML declaration followed by
        ``<segs>...</segs>``; the service reply is inserted verbatim, it is
        not escaped or validated.
    """
    # Preprocess the text
    text = _replace_all(text, _TTL_INPUT_REPLACEMENTS)

    client = zeep.Client("http://ws.racai.ro/ttlws.wsdl")
    text_sgml = client.service.UTF8toSGML(text)
    result = client.service.XCES("ro", "id", text_sgml)

    # Cleanup result - generate valid xml
    result = _replace_all(result, _TTL_OUTPUT_REPLACEMENTS)

    return "<?xml version=\"1.0\" encoding=\"utf-8\" ?><segs>" + result + "</segs>"