|
|
@ -3,6 +3,7 @@ |
|
|
import os |
|
|
import os |
|
|
import codecs |
|
|
import codecs |
|
|
from unicodedata import normalize |
|
|
from unicodedata import normalize |
|
|
|
|
|
import re |
|
|
|
|
|
|
|
|
try: |
|
|
try: |
|
|
from lxml import etree |
|
|
from lxml import etree |
|
|
@ -146,3 +147,11 @@ def obter_uf_por_codigo(codigo_uf): |
|
|
|
|
|
|
|
|
def remover_acentos(txt):
    """Return *txt* with accents and other non-ASCII characters removed.

    The text is decomposed with Unicode NFKD normalization, so an accented
    letter becomes its base letter followed by combining marks. Encoding to
    ASCII with ``'ignore'`` then discards the combining marks.

    Note that any character without an ASCII decomposition is dropped
    silently as well, not transliterated.

    :param txt: text (unicode string) to strip.
    :return: the ASCII-only version of ``txt``.
    """
    decomposed = normalize('NFKD', txt)
    # 'ignore' drops every code point that cannot be represented in ASCII.
    return decomposed.encode('ASCII', 'ignore').decode('ASCII')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def extrai_id_srtxml(edoc):
    """Extract the numeric part of the first ``Id`` attribute in an XML string.

    Searches ``edoc`` for ``Id=`` followed by one or more non-digit
    characters (the opening quote and any alphabetic prefix), then captures
    the run of digits that ends right before a closing double quote.

    :param edoc: XML document as a string.
    :return: the captured digits as a string, or ``''`` when no match is
        found.
    """
    # Raw string: '\d' in a normal string literal is an invalid escape
    # sequence and triggers a warning on recent Python versions.
    match = re.search(r'Id=[^0-9]+(\d+)"', edoc)
    return match.group(1) if match else ''