diff --git a/torchtext/datasets/penntreebank.py b/torchtext/datasets/penntreebank.py
index 06d1f0401f..602a9477b7 100644
--- a/torchtext/datasets/penntreebank.py
+++ b/torchtext/datasets/penntreebank.py
@@ -50,4 +50,4 @@ def PennTreebank(root, split: Union[Tuple[str], str]):
     cache_dp = HttpReader(cache_dp).end_caching(mode="wb", same_filepath_fn=True)
     data_dp = FileOpener(cache_dp, mode="r")
     # remove single leading and trailing space from the dataset
-    return data_dp.readlines(return_path=False).map(lambda t: t.strip())
+    return data_dp.readlines(return_path=False, strip_newline=False)