处理文本数据

# -*- coding: utf-8 -*-
import re

def extract_address(line, prefix_len=6):
    """Return the detail part of an address line.

    The first ``prefix_len`` characters of *line* are dropped (the default
    of 6 is the prefix length the script has always skipped). If the
    remainder contains an ASCII "(", only the text before the first "(" is
    returned, unchanged. Otherwise the remainder is returned with
    surrounding whitespace (including the trailing newline) stripped.
    """
    detail = line[prefix_len:]
    # partition() yields an empty separator when "(" is absent, which
    # replaces the separate find() check plus the non-greedy regex.
    head, paren, _ = detail.partition("(")
    if not paren:
        return detail.strip()
    return head


if __name__ == "__main__":
    filename = 'data.txt'
    with open(filename, 'r', encoding='UTF-8') as file_to_read:
        # Iterating the file stops cleanly at EOF, so the empty string that
        # readline() returns at end-of-file is never processed or printed.
        for line in file_to_read:
            print(extract_address(line))
上海市宝山区士大夫地方
上海市宝山区撒旦发射点(青秀城)
上海市宝山区撒旦发射点士大夫
上海市宝山区士大夫犯得上

猜你喜欢

转载自www.cnblogs.com/gylhaut/p/11609187.html