Skip to content

Commit 8e64e46

Browse files
author
The TensorFlow Datasets Authors
committed
add split to dataset reference
PiperOrigin-RevId: 642547838
1 parent d27cdb1 commit 8e64e46

File tree

2 files changed

+15
-8
lines changed

2 files changed

+15
-8
lines changed

tensorflow_datasets/core/proto/dataset_info.proto

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -154,6 +154,12 @@ message TfdsDatasetReference {
154154
// The namespace of the dataset, e.g. huggingface. Note that we prefix by ds_
155155
// to avoid conflicts with reserved keywords in languages like C++.
156156
string ds_namespace = 5;
157+
158+
// The split of the dataset. Since the dataset reference is used to refer to
159+
// the dataset as a whole, this is usually an empty string, but it can be
160+
// set to a specific split if the dataset reference is used to refer to a
161+
// specific split.
162+
string split = 6;
157163
}
158164

159165
// This is a serialization of tensorflow_datasets.core.DatasetInfo.

tensorflow_datasets/core/proto/dataset_info_generated_pb2.py

Lines changed: 9 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -61,11 +61,12 @@
6161
b' \x01(\t"$\n\x03Url\x12\x0b\n\x03url\x18\x01'
6262
b' \x01(\t\x12\x10\n\x08\x63hecksum\x18\x02'
6363
b' \x01(\t"\x1d\n\x08SqlQuery\x12\x11\n\tsql_query\x18\x01'
64-
b' \x01(\t"m\n\x14TfdsDatasetReference\x12\x0c\n\x04name\x18\x01'
64+
b' \x01(\t"|\n\x14TfdsDatasetReference\x12\x0c\n\x04name\x18\x01'
6565
b' \x01(\t\x12\x0e\n\x06\x63onfig\x18\x02'
6666
b' \x01(\t\x12\x0f\n\x07version\x18\x03'
6767
b' \x01(\t\x12\x10\n\x08\x64\x61ta_dir\x18\x04'
6868
b' \x01(\t\x12\x14\n\x0c\x64s_namespace\x18\x05'
69+
b' \x01(\t\x12\r\n\x05split\x18\x06'
6970
b' \x01(\t"\xb4\x07\n\x0b\x44\x61tasetInfo\x12\x0c\n\x04name\x18\x01'
7071
b' \x01(\t\x12\x13\n\x0b\x64\x65scription\x18\x02'
7172
b' \x01(\t\x12\x0f\n\x07version\x18\t \x01(\t\x12I\n\rrelease_notes\x18\x12'
@@ -142,11 +143,11 @@
142143
_SQLQUERY._serialized_start = 1249
143144
_SQLQUERY._serialized_end = 1278
144145
_TFDSDATASETREFERENCE._serialized_start = 1280
145-
_TFDSDATASETREFERENCE._serialized_end = 1389
146-
_DATASETINFO._serialized_start = 1392
147-
_DATASETINFO._serialized_end = 2340
148-
_DATASETINFO_RELEASENOTESENTRY._serialized_start = 2231
149-
_DATASETINFO_RELEASENOTESENTRY._serialized_end = 2282
150-
_DATASETINFO_DOWNLOADCHECKSUMSENTRY._serialized_start = 2284
151-
_DATASETINFO_DOWNLOADCHECKSUMSENTRY._serialized_end = 2340
146+
_TFDSDATASETREFERENCE._serialized_end = 1404
147+
_DATASETINFO._serialized_start = 1407
148+
_DATASETINFO._serialized_end = 2355
149+
_DATASETINFO_RELEASENOTESENTRY._serialized_start = 2246
150+
_DATASETINFO_RELEASENOTESENTRY._serialized_end = 2297
151+
_DATASETINFO_DOWNLOADCHECKSUMSENTRY._serialized_start = 2299
152+
_DATASETINFO_DOWNLOADCHECKSUMSENTRY._serialized_end = 2355
152153
# @@protoc_insertion_point(module_scope)

0 commit comments

Comments
 (0)