1. 程式人生 > python學習 論語-網路版 處理

python學習 論語-網路版 處理

import re

# Section numbers such as "1·1" or "14·44" that appear in the original text.
_SECTION_MARK = re.compile('[0-9]+·[0-9]+')
# Parenthesised annotation references such as "(1)" or "(12)".
_NOTE_MARK = re.compile(r'\([0-9]+\)')


def extract_original(src_path, dst_path):
    """Copy the passages found under each 【原文】 heading to a new file.

    Reads ``src_path`` line by line.  A line containing ``【原文】`` switches
    copying on (the heading line itself is never written); any other line
    containing ``【`` switches it off again.  While copying is on, section
    numbers of the form ``N·M`` are removed from the line, surrounding
    whitespace is stripped, and the result is written to ``dst_path``
    followed by a newline.

    Both files are handled as UTF-8.
    """
    with open(src_path, 'r', encoding='utf-8') as fi, \
            open(dst_path, 'w', encoding='utf-8') as fo:
        copying = False
        for line in fi:
            if '【原文】' in line:
                copying = True
                continue
            if '【' in line:
                # Any other bracketed heading ends the current passage.
                copying = False
            if copying:
                # Match the section number directly instead of substituting
                # a placeholder and cleaning up the digits around it.
                fo.write(_SECTION_MARK.sub('', line).strip() + '\n')


def strip_annotations(src_path, dst_path):
    """Write a copy of ``src_path`` with ``(N)`` annotation markers removed.

    Every line is traversed in order and each parenthesised run of digits,
    e.g. ``(1)`` or ``(22)``, is replaced with the empty string.  Line
    endings and all other text are written to ``dst_path`` unchanged.

    Both files are handled as UTF-8 so the output does not depend on the
    platform's default encoding.
    """
    with open(src_path, 'r', encoding='utf-8') as fi, \
            open(dst_path, 'w', encoding='utf-8') as fo:
        for line in fi:
            fo.write(_NOTE_MARK.sub('', line))


def main():
    """Run both passes on the fixed file names used by this script."""
    extract_original("論語-網路版.txt", "論語-提取版.txt")
    # The final output was previously spelled "論文-原文.txt", which did not
    # match the other file names; it is written as "論語-原文.txt" here.
    strip_annotations("論語-提取版.txt", "論語-原文.txt")


if __name__ == "__main__":
    main()