Skip to content

Commit 4c8eb15

Browse files
Use "nyu-mll/glue" instead of "glue" for encoder datasets to fix 404 error
Signed-off-by: Jeremy Berchtold <jberchtold@nvidia.com>
1 parent 2dbfbc7 commit 4c8eb15

File tree

4 files changed

+8
-8
lines changed

4 files changed

+8
-8
lines changed

examples/jax/encoder/test_model_parallel_encoder.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -219,11 +219,11 @@ def get_datasets(max_seq_len):
219 | 219 |   vocab = {}
220 | 220 |   word_id = 0
221 | 221 |
222 |     | - train_ds = load_dataset("glue", "cola", split="train")
    | 222 | + train_ds = load_dataset("nyu-mll/glue", "cola", split="train")
223 | 223 |   train_ds.set_format(type="np")
224 | 224 |   train_ds, vocab, word_id = data_preprocess(train_ds, vocab, word_id, max_seq_len)
225 | 225 |
226 |     | - test_ds = load_dataset("glue", "cola", split="validation")
    | 226 | + test_ds = load_dataset("nyu-mll/glue", "cola", split="validation")
227 | 227 |   test_ds.set_format(type="np")
228 | 228 |   test_ds, vocab, word_id = data_preprocess(test_ds, vocab, word_id, max_seq_len)
229 | 229 |   return train_ds, test_ds, word_id

examples/jax/encoder/test_multigpu_encoder.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -197,11 +197,11 @@ def get_datasets(max_seq_len):
197 | 197 |   vocab = {}
198 | 198 |   word_id = 0
199 | 199 |
200 |     | - train_ds = load_dataset("glue", "cola", split="train")
    | 200 | + train_ds = load_dataset("nyu-mll/glue", "cola", split="train")
201 | 201 |   train_ds.set_format(type="np")
202 | 202 |   train_ds, vocab, word_id = data_preprocess(train_ds, vocab, word_id, max_seq_len)
203 | 203 |
204 |     | - test_ds = load_dataset("glue", "cola", split="validation")
    | 204 | + test_ds = load_dataset("nyu-mll/glue", "cola", split="validation")
205 | 205 |   test_ds.set_format(type="np")
206 | 206 |   test_ds, vocab, word_id = data_preprocess(test_ds, vocab, word_id, max_seq_len)
207 | 207 |   return train_ds, test_ds, word_id

examples/jax/encoder/test_multiprocessing_encoder.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -307,11 +307,11 @@ def get_datasets(max_seq_len):
307 | 307 |   vocab = {}
308 | 308 |   word_id = 0
309 | 309 |
310 |     | - train_ds = load_dataset("glue", "cola", split="train")
    | 310 | + train_ds = load_dataset("nyu-mll/glue", "cola", split="train")
311 | 311 |   train_ds.set_format(type="np")
312 | 312 |   train_ds, vocab, word_id = data_preprocess(train_ds, vocab, word_id, max_seq_len)
313 | 313 |
314 |     | - test_ds = load_dataset("glue", "cola", split="validation")
    | 314 | + test_ds = load_dataset("nyu-mll/glue", "cola", split="validation")
315 | 315 |   test_ds.set_format(type="np")
316 | 316 |   test_ds, vocab, word_id = data_preprocess(test_ds, vocab, word_id, max_seq_len)
317 | 317 |   return train_ds, test_ds, word_id

examples/jax/encoder/test_single_gpu_encoder.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -195,11 +195,11 @@ def get_datasets(max_seq_len):
195 | 195 |   vocab = {}
196 | 196 |   word_id = 0
197 | 197 |
198 |     | - train_ds = load_dataset("glue", "cola", split="train")
    | 198 | + train_ds = load_dataset("nyu-mll/glue", "cola", split="train")
199 | 199 |   train_ds.set_format(type="np")
200 | 200 |   train_ds, vocab, word_id = data_preprocess(train_ds, vocab, word_id, max_seq_len)
201 | 201 |
202 |     | - test_ds = load_dataset("glue", "cola", split="validation")
    | 202 | + test_ds = load_dataset("nyu-mll/glue", "cola", split="validation")
203 | 203 |   test_ds.set_format(type="np")
204 | 204 |   test_ds, vocab, word_id = data_preprocess(test_ds, vocab, word_id, max_seq_len)
205 | 205 |   return train_ds, test_ds, word_id

0 commit comments

Comments
 (0)