Skip to content

Commit 2b195ad

Browse files
committed
Updating TorchData DataPipe API usages
1 parent f8ce695 commit 2b195ad

17 files changed

+20 additions, -20 deletions (lines changed)

torchtext/datasets/amazonreviewfull.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -70,7 +70,7 @@ def AmazonReviewFull(root: str, split: Union[Tuple[str], str]):
7070
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
7171
)
7272
cache_decompressed_dp = (
73-
FileOpener(cache_decompressed_dp, mode="b").read_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
73+
FileOpener(cache_decompressed_dp, mode="b").load_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7474
)
7575
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7676

torchtext/datasets/amazonreviewpolarity.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ def AmazonReviewPolarity(root: str, split: Union[Tuple[str], str]):
6767
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
6868
)
6969
cache_decompressed_dp = (
70-
FileOpener(cache_decompressed_dp, mode="b").read_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
70+
FileOpener(cache_decompressed_dp, mode="b").load_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7171
)
7272
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7373

torchtext/datasets/cc100.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -161,7 +161,7 @@ def CC100(root: str, language_code: str = "en"):
161161
cache_decompressed_dp = cache_compressed_dp.on_disk_cache(
162162
filepath_fn=lambda x: os.path.join(root, os.path.basename(x).rstrip(".xz"))
163163
)
164-
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b").read_from_xz()
164+
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b").load_from_xz()
165165
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb")
166166

167167
data_dp = FileOpener(cache_decompressed_dp, encoding="utf-8").readlines(return_path=False)

torchtext/datasets/dbpedia.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,7 @@ def DBpedia(root: str, split: Union[Tuple[str], str]):
6666
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
6767
)
6868
cache_decompressed_dp = (
69-
FileOpener(cache_decompressed_dp, mode="b").read_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
69+
FileOpener(cache_decompressed_dp, mode="b").load_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7070
)
7171
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7272

torchtext/datasets/enwik9.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@ def EnWik9(root: str):
4848
cache_decompressed_dp = cache_compressed_dp.on_disk_cache(
4949
filepath_fn=lambda x: os.path.join(root, os.path.splitext(_PATH)[0])
5050
)
51-
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b").read_from_zip()
51+
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b").load_from_zip()
5252
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
5353

5454
data_dp = FileOpener(cache_decompressed_dp, encoding="utf-8")

torchtext/datasets/imdb.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -62,7 +62,7 @@ def IMDB(root: str, split: Union[Tuple[str], str]):
6262
filepath_fn=lambda x: [os.path.join(root, decompressed_folder, split, label) for label in labels]
6363
)
6464
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b")
65-
cache_decompressed_dp = cache_decompressed_dp.read_from_tar()
65+
cache_decompressed_dp = cache_decompressed_dp.load_from_tar()
6666

6767
def filter_imdb_data(key, fname):
6868
# eg. fname = "aclImdb/train/neg/12416_3.txt"

torchtext/datasets/iwslt2016.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -125,7 +125,7 @@
125125
# avoid additional conditional imports.
126126
def _filter_clean_cache(cache_decompressed_dp, full_filepath, uncleaned_filename):
127127
cache_inner_decompressed_dp = cache_decompressed_dp.on_disk_cache(filepath_fn=lambda x: full_filepath)
128-
cache_inner_decompressed_dp = FileOpener(cache_inner_decompressed_dp, mode="b").read_from_tar()
128+
cache_inner_decompressed_dp = FileOpener(cache_inner_decompressed_dp, mode="b").load_from_tar()
129129
cache_inner_decompressed_dp = cache_inner_decompressed_dp.filter(
130130
lambda x: os.path.basename(uncleaned_filename) in x[0]
131131
)
@@ -263,7 +263,7 @@ def IWSLT2016(
263263
cache_decompressed_dp = cache_compressed_dp.on_disk_cache(filepath_fn=lambda x: inner_iwslt_tar)
264264
cache_decompressed_dp = (
265265
FileOpener(cache_decompressed_dp, mode="b")
266-
.read_from_tar()
266+
.load_from_tar()
267267
.filter(lambda x: os.path.basename(inner_iwslt_tar) in x[0])
268268
)
269269
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)

torchtext/datasets/iwslt2017.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -104,7 +104,7 @@
104104
# avoid additional conditional imports.
105105
def _filter_clean_cache(cache_decompressed_dp, full_filepath, uncleaned_filename):
106106
cache_inner_decompressed_dp = cache_decompressed_dp.on_disk_cache(filepath_fn=lambda x: full_filepath)
107-
cache_inner_decompressed_dp = FileOpener(cache_inner_decompressed_dp, mode="b").read_from_tar()
107+
cache_inner_decompressed_dp = FileOpener(cache_inner_decompressed_dp, mode="b").load_from_tar()
108108
cache_inner_decompressed_dp = cache_inner_decompressed_dp.filter(
109109
lambda x: os.path.basename(uncleaned_filename) in x[0]
110110
)
@@ -208,7 +208,7 @@ def IWSLT2017(root=".data", split=("train", "valid", "test"), language_pair=("de
208208
)
209209

210210
cache_decompressed_dp = cache_compressed_dp.on_disk_cache(filepath_fn=lambda x: inner_iwslt_tar)
211-
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b").read_from_tar()
211+
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b").load_from_tar()
212212
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
213213

214214
src_filename = file_path_by_lang_and_split[src_language][split]

torchtext/datasets/multi30k.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -84,7 +84,7 @@ def Multi30k(root: str, split: Union[Tuple[str], str], language_pair: Tuple[str]
8484
)
8585
src_cache_decompressed_dp = (
8686
FileOpener(src_cache_decompressed_dp, mode="b")
87-
.read_from_tar()
87+
.load_from_tar()
8888
.filter(lambda x: f"{_PREFIX[split]}.{language_pair[0]}" in x[0])
8989
)
9090
src_cache_decompressed_dp = src_cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
@@ -94,7 +94,7 @@ def Multi30k(root: str, split: Union[Tuple[str], str], language_pair: Tuple[str]
9494
)
9595
tgt_cache_decompressed_dp = (
9696
FileOpener(tgt_cache_decompressed_dp, mode="b")
97-
.read_from_tar()
97+
.load_from_tar()
9898
.filter(lambda x: f"{_PREFIX[split]}.{language_pair[1]}" in x[0])
9999
)
100100
tgt_cache_decompressed_dp = tgt_cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)

torchtext/datasets/sogounews.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -70,7 +70,7 @@ def SogouNews(root: str, split: Union[Tuple[str], str]):
7070
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
7171
)
7272
cache_decompressed_dp = (
73-
FileOpener(cache_decompressed_dp, mode="b").read_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
73+
FileOpener(cache_decompressed_dp, mode="b").load_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7474
)
7575
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7676

torchtext/datasets/sst2.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@ def SST2(root, split):
7373
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
7474
)
7575
cache_decompressed_dp = (
76-
FileOpener(cache_decompressed_dp, mode="b").read_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
76+
FileOpener(cache_decompressed_dp, mode="b").load_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7777
)
7878
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7979

torchtext/datasets/udpos.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -61,7 +61,7 @@ def UDPOS(root: str, split: Union[Tuple[str], str]):
6161
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
6262
)
6363
cache_decompressed_dp = (
64-
FileOpener(cache_decompressed_dp, mode="b").read_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
64+
FileOpener(cache_decompressed_dp, mode="b").load_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
6565
)
6666
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
6767

torchtext/datasets/wikitext103.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,7 @@ def WikiText103(root: str, split: Union[Tuple[str], str]):
6666
)
6767
# Extract zip and filter the appropriate split file
6868
cache_decompressed_dp = (
69-
FileOpener(cache_decompressed_dp, mode="b").read_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
69+
FileOpener(cache_decompressed_dp, mode="b").load_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7070
)
7171
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7272
data_dp = FileOpener(cache_decompressed_dp, encoding="utf-8")

torchtext/datasets/wikitext2.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,7 @@ def WikiText2(root: str, split: Union[Tuple[str], str]):
6666
)
6767
# Extract zip and filter the appropriate split file
6868
cache_decompressed_dp = (
69-
FileOpener(cache_decompressed_dp, mode="b").read_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
69+
FileOpener(cache_decompressed_dp, mode="b").load_from_zip().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7070
)
7171
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7272
data_dp = FileOpener(cache_decompressed_dp, encoding="utf-8")

torchtext/datasets/yahooanswers.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ def YahooAnswers(root: str, split: Union[Tuple[str], str]):
6767
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
6868
)
6969
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b")
70-
cache_decompressed_dp = cache_decompressed_dp.read_from_tar()
70+
cache_decompressed_dp = cache_decompressed_dp.load_from_tar()
7171
cache_decompressed_dp = cache_decompressed_dp.filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7272
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7373

torchtext/datasets/yelpreviewfull.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ def YelpReviewFull(root: str, split: Union[Tuple[str], str]):
6767
filepath_fn=lambda x: os.path.join(root, _EXTRACTED_FILES[split])
6868
)
6969
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b")
70-
cache_decompressed_dp = cache_decompressed_dp.read_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
70+
cache_decompressed_dp = cache_decompressed_dp.load_from_tar().filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7171
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)
7272

7373
data_dp = FileOpener(cache_decompressed_dp, encoding="utf-8")

torchtext/datasets/yelpreviewpolarity.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ def YelpReviewPolarity(root: str, split: Union[Tuple[str], str]):
6767
)
6868
cache_decompressed_dp = FileOpener(cache_decompressed_dp, mode="b")
6969

70-
cache_decompressed_dp = cache_decompressed_dp.read_from_tar()
70+
cache_decompressed_dp = cache_decompressed_dp.load_from_tar()
7171

7272
cache_decompressed_dp = cache_decompressed_dp.filter(lambda x: _EXTRACTED_FILES[split] in x[0])
7373
cache_decompressed_dp = cache_decompressed_dp.end_caching(mode="wb", same_filepath_fn=True)

0 commit comments

Comments
 (0)