Skip to content

Commit ab17764

Browse files
iindyk authored and tfx-copybara committed
Making RecordBatchToExamplesEncoder consistent with tf.io.parse_example for RaggedFeatures.
Previously, if a RaggedTensor (RT) had uniform dimensions, the encoding would be incorrect.
PiperOrigin-RevId: 514783895
1 parent fbd7d5f commit ab17764

File tree

2 files changed

+12
-12
lines changed

2 files changed

+12
-12
lines changed

tensorflow_transform/beam/impl_test.py

Lines changed: 8 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -3139,29 +3139,29 @@ def analyzer_fn(inputs):
31393139
'scale_by_min_max$ragged_values': [
31403140
0., 0.285714, 0.428571, 0.142857, 0.285714, 1.
31413141
],
3142-
'scale_by_min_max$row_lengths_1': [0, 4, 0, 2],
3143-
'scale_to_z_score$row_lengths_1': [0, 4, 0, 2],
3142+
'scale_by_min_max$row_lengths_1': [0, 2, 0, 1],
3143+
'scale_to_z_score$row_lengths_1': [0, 2, 0, 1],
31443144
'scale_to_z_score$ragged_values': [
31453145
-1.3333334, -0.22222228, 0.33333328, -0.77777785, -0.22222228,
31463146
2.5555556
31473147
],
3148-
'scale_to_0_1$row_lengths_1': [0, 4, 0, 2],
3148+
'scale_to_0_1$row_lengths_1': [0, 2, 0, 1],
31493149
'scale_to_0_1$ragged_values': [
31503150
0., 0.2857143, 0.42857143, 0.14285715, 0.2857143, 1.
31513151
],
31523152
}, {
31533153
'scale_to_0_1$ragged_values': [
31543154
0.42857143, 0.42857143, 0.14285715, 0.2857143
31553155
],
3156-
'scale_to_0_1$row_lengths_1': [4],
3156+
'scale_to_0_1$row_lengths_1': [2],
31573157
'scale_by_min_max$ragged_values': [
31583158
0.42857143, 0.42857143, 0.14285715, 0.2857143
31593159
],
3160-
'scale_by_min_max$row_lengths_1': [4],
3160+
'scale_by_min_max$row_lengths_1': [2],
31613161
'scale_to_z_score$ragged_values': [
31623162
0.33333328, 0.33333328, -0.77777785, -0.22222228
31633163
],
3164-
'scale_to_z_score$row_lengths_1': [4],
3164+
'scale_to_z_score$row_lengths_1': [2],
31653165
}],
31663166
),
31673167
)
@@ -4544,13 +4544,13 @@ def preprocessing_fn(inputs):
45444544
'x_ones$ragged_values': [1, 1, 1],
45454545
'x_ones$row_lengths_1': [1, 0, 2],
45464546
'y_ones$ragged_values': [1, 1],
4547-
'y_ones$row_lengths_1': [2],
4547+
'y_ones$row_lengths_1': [1],
45484548
},
45494549
{
45504550
'x_ones$ragged_values': [],
45514551
'x_ones$row_lengths_1': [0],
45524552
'y_ones$ragged_values': [1, 1, 1, 1],
4553-
'y_ones$row_lengths_1': [2, 0, 2],
4553+
'y_ones$row_lengths_1': [1, 0, 1],
45544554
},
45554555
]
45564556
expected_metadata = tft.DatasetMetadata.from_feature_spec({

tensorflow_transform/impl_helper_test.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -207,7 +207,7 @@ def _sparse_value_name(tensor_name='sparse'):
207207
'j_row_lengths2': [2, 1, 1],
208208
'k_val': [0, 1, 2, 3, 4, 5, 6, 7, 8],
209209
'l_val': [0, 1, 2, 3, 4, 5],
210-
'l_row_lengths1': [4, 2],
210+
'l_row_lengths1': [2, 1],
211211
}, {
212212
'a': 100,
213213
'b': 2.0,
@@ -227,7 +227,7 @@ def _sparse_value_name(tensor_name='sparse'):
227227
'j_row_lengths2': [1],
228228
'k_val': [9, 10, 11],
229229
'l_val': [6, 7],
230-
'l_row_lengths1': [2],
230+
'l_row_lengths1': [1],
231231
}],
232232
record_batch=_MULTIPLE_FEATURES_CASE_RECORD_BATCH,
233233
feed_dict=_FEED_DICT),
@@ -271,7 +271,7 @@ def _sparse_value_name(tensor_name='sparse'):
271271
'l_val':
272272
np.array([0, 1, 2, 3, 4, 5]),
273273
'l_row_lengths1':
274-
np.array([4, 2]),
274+
np.array([2, 1]),
275275
}, {
276276
'a': np.int64(100),
277277
'b': np.array(2.0, np.float32),
@@ -291,7 +291,7 @@ def _sparse_value_name(tensor_name='sparse'):
291291
'j_row_lengths2': np.array([1]),
292292
'k_val': np.array([9, 10, 11]),
293293
'l_val': np.array([6, 7]),
294-
'l_row_lengths1': np.array([2]),
294+
'l_row_lengths1': np.array([1]),
295295
}],
296296
record_batch=_MULTIPLE_FEATURES_CASE_RECORD_BATCH,
297297
feed_dict=_FEED_DICT),

0 commit comments

Comments
 (0)