diff --git a/src/torchaudio/datasets/commonvoice.py b/src/torchaudio/datasets/commonvoice.py index db0e035c61..e0e8dfd47a 100644 --- a/src/torchaudio/datasets/commonvoice.py +++ b/src/torchaudio/datasets/commonvoice.py @@ -49,7 +49,7 @@ def __init__(self, root: Union[str, Path], tsv: str = "train.tsv") -> None: self._path = os.fspath(root) self._tsv = os.path.join(self._path, tsv) - with open(self._tsv, "r") as tsv_: + with open(self._tsv, "r", encoding="utf-8") as tsv_: walker = csv.reader(tsv_, delimiter="\t") self._header = next(walker) self._walker = list(walker)