Skip to content

Commit f85700f

Browse files
fix minor error
1 parent 2c389b4 commit f85700f

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

bert_pytorch/dataset/vocab.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -188,12 +188,13 @@ def build():
188188
vocab = WordVocab(f, max_size=args.vocab_size, min_freq=args.min_freq)
189189
elif os.path.isdir(args.corpus_path):
190190
logger.info(f"is dir")
191+
print("get corpus")
191192
texts = []
192193
for index, corpus in tqdm(enumerate(os.listdir(args.corpus_path))):
194+
print("getting {}".format(corpus))
193195
with open(os.path.join(args.corpus_path,corpus), "r", encoding=args.encoding) as f:
194196
texts += f.readlines()
195197
# print(type(f))
196-
break
197198
vocab = WordVocab(texts, max_size=args.vocab_size, min_freq=args.min_freq)
198199
pass
199200
else:

0 commit comments

Comments
 (0)