# Provenance: misc/process.py as added by commit
# 2fe442cce5ddeeddf66958ee42a9d2d244d1a39e ("update", zhang, 2022-10-23).
"""Interleave and de-interleave line-aligned Chinese/English text files.

``merge`` zips ``raw_chinese.txt`` and ``raw_english.txt`` into a single
date-stamped file with alternating Chinese/English rows; ``split`` does the
reverse, writing the even rows and odd rows of the merged file to separate
date-stamped files.  All paths are relative to the current working directory.
"""

from datetime import datetime


def _date_tag(today=None):
    """Return the date suffix used in the generated file names.

    Resolution order: the explicit *today* argument, then a module-level
    ``today`` variable if one has been set (the way the script entry point
    historically provided it), then the current local date as ``YYYYMMDD``.
    """
    if today is not None:
        return today
    module_level = globals().get('today')
    if module_level is not None:
        return module_level
    return datetime.now().strftime('%Y%m%d')


def merge(today=None):
    """Write ``merge_<tag>.txt`` with alternating Chinese and English rows.

    Each Chinese row has ASCII commas replaced by spaces and all whitespace
    runs collapsed to a single space; each English row is copied verbatim.
    Rows are paired positionally, so output stops at the end of the shorter
    input file.

    Args:
        today: Optional date tag for the output file name.  When omitted,
            see ``_date_tag`` for how the tag is chosen.

    Raises:
        OSError: If an input file cannot be read or the output file cannot
            be written.
    """
    tag = _date_tag(today)
    # Inputs are opened before the output so a missing input does not leave
    # an empty merge file behind.
    with open('./raw_chinese.txt', encoding='UTF-8') as zh_file, \
            open('./raw_english.txt', encoding='UTF-8') as en_file, \
            open('./merge_{}.txt'.format(tag), 'w', encoding='UTF-8') as out:
        for c_row, e_row in zip(zh_file, en_file):
            # NOTE(review): the original chained two identical-looking
            # replace(',', ' ') calls; one of them may have targeted a
            # fullwidth comma before the text was re-encoded -- confirm.
            c_row = c_row.replace(',', ' ')
            out.write(' '.join(c_row.split()) + '\n')
            out.write(e_row)


def split(today=None):
    """Split ``merge_<tag>.txt`` back into per-language files.

    Rows at even 0-based positions go to ``chinese_<tag>.txt`` and rows at
    odd positions go to ``english_<tag>.txt``, unchanged.

    Args:
        today: Optional date tag used for the input and output file names.
            When omitted, see ``_date_tag`` for how the tag is chosen.

    Raises:
        OSError: If the merged file cannot be read or an output file cannot
            be written.
    """
    tag = _date_tag(today)
    with open('./merge_{}.txt'.format(tag), encoding='utf-8') as merged, \
            open('./chinese_{}.txt'.format(tag), 'w', encoding='utf-8') as zh_out, \
            open('./english_{}.txt'.format(tag), 'w', encoding='utf-8') as en_out:
        for i, row in enumerate(merged):
            target = zh_out if i % 2 == 0 else en_out
            target.write(row)


if __name__ == '__main__':
    today = datetime.now().strftime('%Y%m%d')
    # merge(today)  # enable to rebuild the merged file before splitting
    split(today)