mirror of
https://github.com/karl0ss/comfy_fm24_newgens.git
synced 2025-04-28 20:03:40 +01:00
34 lines
1.2 KiB
Python
34 lines
1.2 KiB
Python
import re
|
|
|
|
|
|
class RTF_Parser:
|
|
def __init__(self):
|
|
pass
|
|
|
|
def parse_rtf(self, path):
|
|
UID_regex = re.compile('([0-9]){4,}')
|
|
result_data = []
|
|
rtf = open(path, 'r', encoding="UTF-8")
|
|
# self.logger.info(rtf)
|
|
rtf_data = []
|
|
for line in rtf:
|
|
if UID_regex.search(line):
|
|
# self.logger.info(line.strip())
|
|
rtf_data.append(line.strip())
|
|
for newgen in rtf_data:
|
|
data_fields = newgen.split('|')
|
|
sec_nat = data_fields[3].strip()
|
|
if sec_nat == '':
|
|
sec_nat = None
|
|
result_data.append([data_fields[1].strip(), data_fields[2].strip(), sec_nat, data_fields[5].strip(),data_fields[6].strip(),data_fields[7].strip(),data_fields[8].strip(),data_fields[9].strip(), data_fields[4].strip()])
|
|
rtf.close()
|
|
return result_data
|
|
|
|
def is_rtf_valid(self, path):
|
|
rtf_regex = re.compile('(\|\s*[0-9]{8,}\s*)(\|\s*([A-Z]{3})*\s*)+(\|[\s*\w*\.*\-*]+)(\|[\s*\d+]+){3}\|')
|
|
rtf = open(path, 'r', encoding="UTF-8")
|
|
rtf_data = rtf.read()
|
|
rtf.close()
|
|
if rtf_regex.search(rtf_data):
|
|
return True
|
|
return False |