import re
def remove_non_chinese(input_str: str) -> str:
    """Return *input_str* with only its Chinese characters kept.

    A character is kept when it lies in the range U+4E00 to U+9FA5
    (inclusive); every other character -- ASCII letters, digits,
    punctuation, regex metacharacters, whitespace -- is dropped. The
    relative order of the kept characters is preserved.

    Args:
        input_str: The text to filter.

    Returns:
        A new string made of the kept characters, or ``""`` when the
        input contains none.
    """
    # findall yields one single-character match per kept character, in
    # order, so joining them rebuilds the filtered string.
    return "".join(re.findall(r'[\u4e00-\u9fa5]', input_str))
# Demo: match a sentence against a rule, then print only the part of each
# match that was covered by the rule's wildcard section.
sentence = "我爱北京天安门"
rule = "我爱北京.{1,3}"

# Every non-overlapping substring of the sentence that matches the rule.
foundall = re.findall(rule, sentence)

# Recover the literal text of the rule by dropping everything that is not a
# Chinese character. This works here because the rule's literal part is all
# Chinese while its regex syntax (".{1,3}") contains no Chinese characters.
rule_replace_part = remove_non_chinese(rule)

for found in foundall:
    # NOTE: str.replace removes every occurrence of the literal text in the
    # match, not just a leading one.
    print(found.replace(rule_replace_part, ""))
# Printed output:
# 天安门