This commit is contained in:
loujie0822 2020-08-25 20:00:45 +08:00
parent b7b38d2952
commit 63b1a3eff5
2 changed files with 2 additions and 1 deletion

View File

@@ -128,7 +128,7 @@ if __name__ == '__main__':
# print("―", extractor.is_chinese_or_punct("―"))
# print("-", extractor.is_chinese_or_punct("-"))
text_raw = "1%2%ALL患者有Burkitt淋巴瘤的形态学及免疫学特征即FAB形态学分类中的L3型常伴有腹部或其余部位的包块性疾病可以将之视为极晚期Burkitt淋巴瘤对这类患儿应采用晚期Burkitt淋巴瘤的治疗方案。"
text_raw = "3抗甲状腺球蛋白及抗甲状腺微粒体抗体TGA与TPO在桥本甲状腺炎患者血清中高滴度TGA90%95%TPO检测也有相应诊断价值"
sub_text = []
buff = ""

View File

@@ -49,6 +49,7 @@ def write_json(obj, path):
encode('utf-8'))
def _read_conll(path, encoding='utf-8', indexes=2, dropna=True):
"""
Construct a generator to read conll items.