# PapyriBot / formatear_achivos-transfo.py
# delarosajav95's picture
# Upload 9 files
# 05c431f verified
import os
import re
# Root of the corpus whose XML files are renamed to a .txt extension.
corpus = 'training_texts/DDB_EpiDoc_XML/'


def rename_xml_to_txt(directory):
    """Rename every regular ``*.xml`` file directly inside *directory* to ``*.txt``.

    Only the final ``.xml`` extension is replaced; the file contents are not
    touched. Entries that are not regular files (e.g. sub-directories) and
    files without a ``.xml`` extension are left alone, so a directory whose
    name happens to end in "xml" is never renamed.

    Args:
        directory: Path of the directory to process (not recursive).

    Returns:
        The list of new ``.txt`` paths, in the order they were renamed.

    Raises:
        OSError: Propagated from ``os.listdir`` / ``os.rename``.
    """
    suffix = '.xml'
    renamed = []
    for name in os.listdir(directory):
        source = os.path.join(directory, name)
        # Require the dot so names that merely end in "xml" are skipped, and
        # require a regular file so directories are never renamed.
        if not name.endswith(suffix) or not os.path.isfile(source):
            continue
        target = source[:-len(suffix)] + '.txt'
        print(target)
        # NOTE(review): os.rename may replace an existing target on POSIX and
        # raises on Windows; add an explicit existence check if that matters.
        os.rename(source, target)
        renamed.append(target)
    return renamed


# Snapshot every directory under the corpus that holds at least one file
# before renaming anything.
path_list = [root for root, _dirs, files in os.walk(corpus) if files]

for p in path_list:
    rename_xml_to_txt(p)