We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3d956d1, commit de4e74e (Copy full SHA for de4e74e)
1 file changed
src/createtask.py
@@ -14,7 +14,7 @@ def dataset_fn(split, shuffle_files=False):
14
files_to_read=[os.path.join("gs://"+nq_tsv_path["bucket"],str(filename.name)) for filename in client.list_blobs(nq_tsv_path["bucket"], prefix=nq_tsv_path[split])]
15
else:
16
print(os.path.join(nq_tsv_path["bucket"], nq_tsv_path[split]))
17
- files_to_read=[os.path.join(nq_tsv_path["bucket"],str(filename)) for filename in os.listdir(os.path.join(nq_tsv_path["bucket"], nq_tsv_path[split]))]
+ files_to_read=[os.path.join(nq_tsv_path["bucket"],nq_tsv_path[split],str(filename)) for filename in os.listdir(os.path.join(nq_tsv_path["bucket"], nq_tsv_path[split]))]
18
print(len(files_to_read))
19
print(files_to_read[0:10])
20
ds = tf.data.TextLineDataset(files_to_read, compression_type=nq_tsv_path["compression"]).filter(lambda line:tf.not_equal(tf.strings.length(line),0))
0 commit comments