Skip to content

Commit 07f547b

Browse files
Merge pull request #2544 from iamsdas:desc
PiperOrigin-RevId: 336117107
2 parents 83d38fe + dba0436, commit 07f547b

File tree

3 files changed

+35
-20
lines changed

3 files changed

+35
-20
lines changed

tensorflow_datasets/core/dataset_info.py

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -121,13 +121,19 @@ def __init__(self,
121121
"""
122122
self._builder = builder
123123

124+
if builder.builder_config:
125+
config_name = builder.builder_config.name
126+
config_description = builder.builder_config.description
127+
else:
128+
config_name = None
129+
config_description = None
130+
124131
self._info_proto = dataset_info_pb2.DatasetInfo(
125132
name=builder.name,
126133
description=utils.dedent(description),
127-
version=str(builder._version), # pylint: disable=protected-access
128-
config_name=(
129-
builder.builder_config.name if builder.builder_config else None
130-
),
134+
version=str(builder.version),
135+
config_name=config_name,
136+
config_description=config_description,
131137
citation=utils.dedent(citation),
132138
redistribution_info=dataset_info_pb2.RedistributionInfo(
133139
license=utils.dedent(redistribution_info.pop("license")),

tensorflow_datasets/core/proto/dataset_info.proto

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -61,6 +61,9 @@ message DatasetInfo {
6161
// Config name of the dataset
6262
string config_name = 13;
6363

64+
// Config description of the dataset
65+
string config_description = 14;
66+
6467
// A citation string if one exists for this dataset.
6568
string citation = 3;
6669

@@ -90,5 +93,5 @@ message DatasetInfo {
9093

9194
RedistributionInfo redistribution_info = 11;
9295

93-
// Next available: 14
96+
// Next available: 15
9497
}

tensorflow_datasets/core/proto/dataset_info_generated_pb2.py

Lines changed: 21 additions & 15 deletions
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,6 @@
1818
# -*- coding: utf-8 -*-
1919
# Generated by the protocol buffer compiler. DO NOT EDIT!
2020
# source: dataset_info.proto
21-
"""Generated protocol buffer code."""
2221

2322
from google.protobuf import descriptor as _descriptor
2423
from google.protobuf import message as _message
@@ -38,7 +37,7 @@
3837
package='tensorflow_datasets',
3938
syntax='proto3',
4039
serialized_options=b'\370\001\001',
41-
serialized_pb=b'\n\x12\x64\x61taset_info.proto\x12\x13tensorflow_datasets\x1a-tensorflow_metadata/proto/v0/statistics.proto\x1a)tensorflow_metadata/proto/v0/schema.proto\"\x1f\n\x0f\x44\x61tasetLocation\x12\x0c\n\x04urls\x18\x01 \x03(\t\"\x9d\x01\n\tSplitInfo\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nnum_shards\x18\x02 \x01(\x03\x12\x15\n\rshard_lengths\x18\x04 \x03(\x03\x12\x11\n\tnum_bytes\x18\x05 \x01(\x03\x12\x44\n\nstatistics\x18\x03 \x01(\x0b\x32\x30.tensorflow.metadata.v0.DatasetFeatureStatistics\"/\n\x0eSupervisedKeys\x12\r\n\x05input\x18\x01 \x01(\t\x12\x0e\n\x06output\x18\x02 \x01(\t\"%\n\x12RedistributionInfo\x12\x0f\n\x07license\x18\x01 \x01(\t\"\xc9\x04\n\x0b\x44\x61tasetInfo\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x13\n\x0b\x64\x65scription\x18\x02 \x01(\t\x12\x0f\n\x07version\x18\t \x01(\t\x12\x13\n\x0b\x63onfig_name\x18\r \x01(\t\x12\x10\n\x08\x63itation\x18\x03 \x01(\t\x12\x19\n\rsize_in_bytes\x18\x04 \x01(\x03\x42\x02\x18\x01\x12\x15\n\rdownload_size\x18\x0c \x01(\x03\x12\x36\n\x08location\x18\x05 \x01(\x0b\x32$.tensorflow_datasets.DatasetLocation\x12W\n\x12\x64ownload_checksums\x18\n \x03(\x0b\x32\x37.tensorflow_datasets.DatasetInfo.DownloadChecksumsEntryB\x02\x18\x01\x12.\n\x06schema\x18\x06 \x01(\x0b\x32\x1e.tensorflow.metadata.v0.Schema\x12.\n\x06splits\x18\x07 \x03(\x0b\x32\x1e.tensorflow_datasets.SplitInfo\x12<\n\x0fsupervised_keys\x18\x08 \x01(\x0b\x32#.tensorflow_datasets.SupervisedKeys\x12\x44\n\x13redistribution_info\x18\x0b \x01(\x0b\x32\'.tensorflow_datasets.RedistributionInfo\x1a\x38\n\x16\x44ownloadChecksumsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x42\x03\xf8\x01\x01\x62\x06proto3'
40+
serialized_pb=b'\n\x12\x64\x61taset_info.proto\x12\x13tensorflow_datasets\x1a-tensorflow_metadata/proto/v0/statistics.proto\x1a)tensorflow_metadata/proto/v0/schema.proto\"\x1f\n\x0f\x44\x61tasetLocation\x12\x0c\n\x04urls\x18\x01 \x03(\t\"\x9d\x01\n\tSplitInfo\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x12\n\nnum_shards\x18\x02 \x01(\x03\x12\x15\n\rshard_lengths\x18\x04 \x03(\x03\x12\x11\n\tnum_bytes\x18\x05 \x01(\x03\x12\x44\n\nstatistics\x18\x03 \x01(\x0b\x32\x30.tensorflow.metadata.v0.DatasetFeatureStatistics\"/\n\x0eSupervisedKeys\x12\r\n\x05input\x18\x01 \x01(\t\x12\x0e\n\x06output\x18\x02 \x01(\t\"%\n\x12RedistributionInfo\x12\x0f\n\x07license\x18\x01 \x01(\t\"\xe5\x04\n\x0b\x44\x61tasetInfo\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x13\n\x0b\x64\x65scription\x18\x02 \x01(\t\x12\x0f\n\x07version\x18\t \x01(\t\x12\x13\n\x0b\x63onfig_name\x18\r \x01(\t\x12\x1a\n\x12\x63onfig_description\x18\x0e \x01(\t\x12\x10\n\x08\x63itation\x18\x03 \x01(\t\x12\x19\n\rsize_in_bytes\x18\x04 \x01(\x03\x42\x02\x18\x01\x12\x15\n\rdownload_size\x18\x0c \x01(\x03\x12\x36\n\x08location\x18\x05 \x01(\x0b\x32$.tensorflow_datasets.DatasetLocation\x12W\n\x12\x64ownload_checksums\x18\n \x03(\x0b\x32\x37.tensorflow_datasets.DatasetInfo.DownloadChecksumsEntryB\x02\x18\x01\x12.\n\x06schema\x18\x06 \x01(\x0b\x32\x1e.tensorflow.metadata.v0.Schema\x12.\n\x06splits\x18\x07 \x03(\x0b\x32\x1e.tensorflow_datasets.SplitInfo\x12<\n\x0fsupervised_keys\x18\x08 \x01(\x0b\x32#.tensorflow_datasets.SupervisedKeys\x12\x44\n\x13redistribution_info\x18\x0b \x01(\x0b\x32\'.tensorflow_datasets.RedistributionInfo\x1a\x38\n\x16\x44ownloadChecksumsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\x42\x03\xf8\x01\x01\x62\x06proto3'
4241
,
4342
dependencies=[tensorflow__metadata_dot_proto_dot_v0_dot_statistics__pb2.DESCRIPTOR,tensorflow__metadata_dot_proto_dot_v0_dot_schema__pb2.DESCRIPTOR,])
4443

@@ -237,8 +236,8 @@
237236
extension_ranges=[],
238237
oneofs=[
239238
],
240-
serialized_start=944,
241-
serialized_end=1000,
239+
serialized_start=972,
240+
serialized_end=1028,
242241
)
243242

244243
_DATASETINFO = _descriptor.Descriptor(
@@ -277,63 +276,70 @@
277276
is_extension=False, extension_scope=None,
278277
serialized_options=None, file=DESCRIPTOR),
279278
_descriptor.FieldDescriptor(
280-
name='citation', full_name='tensorflow_datasets.DatasetInfo.citation', index=4,
279+
name='config_description', full_name='tensorflow_datasets.DatasetInfo.config_description', index=4,
280+
number=14, type=9, cpp_type=9, label=1,
281+
has_default_value=False, default_value=b"".decode('utf-8'),
282+
message_type=None, enum_type=None, containing_type=None,
283+
is_extension=False, extension_scope=None,
284+
serialized_options=None, file=DESCRIPTOR),
285+
_descriptor.FieldDescriptor(
286+
name='citation', full_name='tensorflow_datasets.DatasetInfo.citation', index=5,
281287
number=3, type=9, cpp_type=9, label=1,
282288
has_default_value=False, default_value=b"".decode('utf-8'),
283289
message_type=None, enum_type=None, containing_type=None,
284290
is_extension=False, extension_scope=None,
285291
serialized_options=None, file=DESCRIPTOR),
286292
_descriptor.FieldDescriptor(
287-
name='size_in_bytes', full_name='tensorflow_datasets.DatasetInfo.size_in_bytes', index=5,
293+
name='size_in_bytes', full_name='tensorflow_datasets.DatasetInfo.size_in_bytes', index=6,
288294
number=4, type=3, cpp_type=2, label=1,
289295
has_default_value=False, default_value=0,
290296
message_type=None, enum_type=None, containing_type=None,
291297
is_extension=False, extension_scope=None,
292298
serialized_options=b'\030\001', file=DESCRIPTOR),
293299
_descriptor.FieldDescriptor(
294-
name='download_size', full_name='tensorflow_datasets.DatasetInfo.download_size', index=6,
300+
name='download_size', full_name='tensorflow_datasets.DatasetInfo.download_size', index=7,
295301
number=12, type=3, cpp_type=2, label=1,
296302
has_default_value=False, default_value=0,
297303
message_type=None, enum_type=None, containing_type=None,
298304
is_extension=False, extension_scope=None,
299305
serialized_options=None, file=DESCRIPTOR),
300306
_descriptor.FieldDescriptor(
301-
name='location', full_name='tensorflow_datasets.DatasetInfo.location', index=7,
307+
name='location', full_name='tensorflow_datasets.DatasetInfo.location', index=8,
302308
number=5, type=11, cpp_type=10, label=1,
303309
has_default_value=False, default_value=None,
304310
message_type=None, enum_type=None, containing_type=None,
305311
is_extension=False, extension_scope=None,
306312
serialized_options=None, file=DESCRIPTOR),
307313
_descriptor.FieldDescriptor(
308-
name='download_checksums', full_name='tensorflow_datasets.DatasetInfo.download_checksums', index=8,
314+
name='download_checksums', full_name='tensorflow_datasets.DatasetInfo.download_checksums', index=9,
309315
number=10, type=11, cpp_type=10, label=3,
310316
has_default_value=False, default_value=[],
311317
message_type=None, enum_type=None, containing_type=None,
312318
is_extension=False, extension_scope=None,
313319
serialized_options=b'\030\001', file=DESCRIPTOR),
314320
_descriptor.FieldDescriptor(
315-
name='schema', full_name='tensorflow_datasets.DatasetInfo.schema', index=9,
321+
name='schema', full_name='tensorflow_datasets.DatasetInfo.schema', index=10,
316322
number=6, type=11, cpp_type=10, label=1,
317323
has_default_value=False, default_value=None,
318324
message_type=None, enum_type=None, containing_type=None,
319325
is_extension=False, extension_scope=None,
320326
serialized_options=None, file=DESCRIPTOR),
321327
_descriptor.FieldDescriptor(
322-
name='splits', full_name='tensorflow_datasets.DatasetInfo.splits', index=10,
328+
name='splits', full_name='tensorflow_datasets.DatasetInfo.splits', index=11,
323329
number=7, type=11, cpp_type=10, label=3,
324330
has_default_value=False, default_value=[],
325331
message_type=None, enum_type=None, containing_type=None,
326332
is_extension=False, extension_scope=None,
327333
serialized_options=None, file=DESCRIPTOR),
328334
_descriptor.FieldDescriptor(
329-
name='supervised_keys', full_name='tensorflow_datasets.DatasetInfo.supervised_keys', index=11,
335+
name='supervised_keys', full_name='tensorflow_datasets.DatasetInfo.supervised_keys', index=12,
330336
number=8, type=11, cpp_type=10, label=1,
331337
has_default_value=False, default_value=None,
332338
message_type=None, enum_type=None, containing_type=None,
333339
is_extension=False, extension_scope=None,
334340
serialized_options=None, file=DESCRIPTOR),
335341
_descriptor.FieldDescriptor(
336-
name='redistribution_info', full_name='tensorflow_datasets.DatasetInfo.redistribution_info', index=12,
342+
name='redistribution_info', full_name='tensorflow_datasets.DatasetInfo.redistribution_info', index=13,
337343
number=11, type=11, cpp_type=10, label=1,
338344
has_default_value=False, default_value=None,
339345
message_type=None, enum_type=None, containing_type=None,
@@ -352,7 +358,7 @@
352358
oneofs=[
353359
],
354360
serialized_start=415,
355-
serialized_end=1000,
361+
serialized_end=1028,
356362
)
357363

358364
_SPLITINFO.fields_by_name['statistics'].message_type = tensorflow__metadata_dot_proto_dot_v0_dot_statistics__pb2._DATASETFEATURESTATISTICS
@@ -418,4 +424,4 @@
418424
_DATASETINFO_DOWNLOADCHECKSUMSENTRY._options = None
419425
_DATASETINFO.fields_by_name['size_in_bytes']._options = None
420426
_DATASETINFO.fields_by_name['download_checksums']._options = None
421-
# @@protoc_insertion_point(module_scope)
427+
# @@protoc_insertion_point(module_scope)

0 commit comments

Comments
 (0)