Skip to content

Commit bdc64b4

Browse files
committed
Add try-except for duration parsing to handle ValueError and TypeError gracefully
1 parent 5e36f29 commit bdc64b4

File tree

3 files changed

+23
-5
lines changed

3 files changed

+23
-5
lines changed

infra/scripts/index_scripts/03_cu_process_data_text.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -215,7 +215,11 @@ def get_field_value(fields, field_name, default=""):
215215
conversation_id = file_name.split('convo_', 1)[1].split('_')[0]
216216
conversationIds.append(conversation_id)
217217
fields = result['result']['contents'][0]['fields']
218-
duration = int(get_field_value(fields, 'Duration', '0'))
218+
duration_str = get_field_value(fields, 'Duration', '0')
219+
try:
220+
duration = int(duration_str)
221+
except (ValueError, TypeError):
222+
duration = 0
219223
end_timestamp = str(start_timestamp + timedelta(seconds=duration)).split(".")[0]
220224
start_timestamp = str(start_timestamp).split(".")[0]
221225
summary = get_field_value(fields, 'summary')

infra/scripts/index_scripts/03_cu_process_data_text_manual.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -218,7 +218,11 @@ def get_field_value(fields, field_name, default=""):
218218
conversation_id = file_name.split('convo_', 1)[1].split('_')[0]
219219
conversationIds.append(conversation_id)
220220
fields = result['result']['contents'][0]['fields']
221-
duration = int(get_field_value(fields, 'Duration', '0'))
221+
duration_str = get_field_value(fields, 'Duration', '0')
222+
try:
223+
duration = int(duration_str)
224+
except (ValueError, TypeError):
225+
duration = 0
222226
end_timestamp = str(start_timestamp + timedelta(seconds=duration)).split(".")[0]
223227
start_timestamp = str(start_timestamp).split(".")[0]
224228
summary = get_field_value(fields, 'summary')

infra/scripts/index_scripts/04_cu_process_data_new_data.py

Lines changed: 13 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -286,8 +286,14 @@ def get_field_value(fields, field_name, default=""):
286286
start_timestamp = datetime.strptime(start_time, timestamp_format)
287287
conversation_id = file_name.split('convo_', 1)[1].split('_')[0]
288288
conversationIds.append(conversation_id)
289+
289290
fields = result['result']['contents'][0]['fields']
290-
duration = int(get_field_value(fields, 'Duration', '0'))
291+
duration_str = get_field_value(fields, 'Duration', '0')
292+
try:
293+
duration = int(duration_str)
294+
except (ValueError, TypeError):
295+
duration = 0
296+
291297
end_timestamp = str(start_timestamp + timedelta(seconds=duration)).split(".")[0]
292298
start_timestamp = str(start_timestamp).split(".")[0]
293299
summary = get_field_value(fields, 'summary')
@@ -340,11 +346,15 @@ def get_field_value(fields, field_name, default=""):
340346
timestamp_format = "%Y-%m-%d %H_%M_%S" # Adjust format if necessary
341347
start_timestamp = datetime.strptime(start_time, timestamp_format)
342348

343-
conversation_id = file_name.split('convo_', 1)[1].split('_')[0]
344349
conversationIds.append(conversation_id)
345350

346351
fields = result['result']['contents'][0]['fields']
347-
duration = int(get_field_value(fields, 'Duration', '0'))
352+
duration_str = get_field_value(fields, 'Duration', '0')
353+
try:
354+
duration = int(duration_str)
355+
except (ValueError, TypeError):
356+
duration = 0
357+
348358
end_timestamp = str(start_timestamp + timedelta(seconds=duration))
349359
end_timestamp = end_timestamp.split(".")[0]
350360
start_timestamp = str(start_timestamp).split(".")[0]

0 commit comments

Comments
 (0)