Skip to content

Commit 2f43983

Browse files
author
Guanheng Zhang
committed
Fix ascii decode error
1 parent 5d7e194 commit 2f43983

File tree

1 file changed

+2
-1
lines changed

1 file changed

+2
-1
lines changed

beginner_source/torchtext_translation_tutorial.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -69,7 +69,8 @@ def build_vocab(filepath, tokenizer):
69 69
en_vocab = build_vocab(train_filepaths[1], en_tokenizer)
70 70

71 71
def data_process(filepaths):
72-
raw_de_iter, raw_en_iter = iter(io.open(filepaths[0])), iter(io.open(filepaths[1]))
72+
raw_de_iter = iter(io.open(filepaths[0], encoding="utf8"))
73+
raw_en_iter = iter(io.open(filepaths[1], encoding="utf8"))
73 74
data = []
74 75
for (raw_de, raw_en) in zip(raw_de_iter, raw_en_iter):
75 76
de_tensor_ = torch.tensor([de_vocab[token] for token in de_tokenizer(raw_de)],

0 commit comments

Comments
 (0)