-
Notifications
You must be signed in to change notification settings - Fork 135
/
Copy pathprepare_dialog.py
36 lines (31 loc) · 912 Bytes
/
prepare_dialog.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# -*- coding:utf-8 -*-
'''
@Author: yanwii
@Date: 2018-05-14 14:52:35
'''
import re
import sys
def prepare(num_dialogs=1000):
    """Split the raw conversation corpus into question and answer files.

    Reads ``dialog/xiaohuangji50w_nofenci.conv``, extracts every record of
    the form ``E`` / ``M <question>`` / ``M <answer>`` (each on its own
    line), keeps the leading ``num_dialogs`` records and writes the
    questions to ``dialog/Q`` and the answers to ``dialog/A`` via ``save``.
    Both output files list their entries in the same order, one per line.

    Args:
        num_dialogs: Number of question/answer pairs to keep, applied as a
            plain slice ``[:num_dialogs]`` over the matched records. If the
            corpus holds fewer records, all of them are kept.
    """
    # Decode explicitly so the result does not depend on the platform's
    # default locale encoding.
    # NOTE(review): assumes the corpus file is UTF-8 encoded -- confirm.
    with open("dialog/xiaohuangji50w_nofenci.conv", encoding="utf-8") as fopen:
        text = fopen.read()

    # Non-greedy groups: each capture stops at the first newline after it.
    reg = re.compile(r"E\nM (.*?)\nM (.*?)\n")

    # Slicing already handles num_dialogs >= number of matches, so no
    # explicit length check is needed.
    dialogs = reg.findall(text)[:num_dialogs]

    questions = [que for que, _ in dialogs]
    answers = [ans for _, ans in dialogs]
    save(questions, "dialog/Q")
    save(answers, "dialog/A")
def save(dialogs, file):
    """Write the given strings to ``file``, one per line.

    The entries are joined with ``"\\n"``; no trailing newline is added
    after the last entry. An existing file at ``file`` is overwritten.

    Args:
        dialogs: Iterable of strings to write.
        file: Path of the output file.
    """
    # Encode explicitly as UTF-8 so non-ASCII dialog text is written the
    # same way regardless of the platform's default locale encoding.
    with open(file, "w", encoding="utf-8") as fopen:
        fopen.write("\n".join(dialogs))
if __name__ == "__main__":
    # Script entry point: an optional first command-line argument gives the
    # number of dialogs to export; without it, prepare() uses its default.
    cli_args = sys.argv[1:]
    if not cli_args:
        prepare()
    else:
        prepare(int(cli_args[0]))