python提取⽂本中的成语_python如何实现提取⽂本中所有连
续的词语
# !/usr/bin/env python 3
# encoding: utf-8
def split_line(line,n):
if len(line) <=n:
return line
else:
s = ""
for i in range(len(line)-n+1):
s += line[i:i+n]
s += ";"
s += "\n"
return s
if __name__ == '__main__':
# 词组长度
seq_len = 2
# 读取⽂件路径
path = "./"
file = open(path,'r',encoding='utf-8')
# 保存结果路径
result_path = "./"
result_file = open(result_path,'w',encoding='utf-8')
for line in file:
temp = line.strip()
result_file.writelines(split_line(temp,seq_len))
#  关闭⽂件
file.close()
result_file.close()# 我⽤你给的⽂本做了测试;下⾯是输出
单⼀;⼀结;结构;
writelines在python中的用法
象形;形字;
不是;是槌;槌的;的打;打击;
乃是;是⽔;⽔的;的载;载歌;歌载;载舞;
使鹅;鹅卵;卵⽯;⽯臻;臻于;于完;完美;
渐臻;臻佳;佳境;
⽇臻;臻完;完善;
左右;右结;结构;
友谊;谊的;的主;主要;要效;效⽤;⽤之;之⼀;⼀就;就在;在使;使⼈;⼈⼼;⼼中;中的;的愤;愤懑;懑抑;抑郁;郁之;之⽓;⽓得;得以;以宣;宣泄;泄弛;弛放;这些;些不;不平;平之;之⽓;⽓是;是各;各种;种的;的情;情感;感都;都可;可以;以引;引起;起的;