Skip to content

Commit 2a1bf11

Browse files
committed
fixed some comments
1 parent 6e957f6 commit 2a1bf11

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

notebooks/experiments/minutes_diarization/download_minutes.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -21,11 +21,11 @@ def download_minutes_pdfs():
2121
# Parse the HTML using selectolax
2222
tree = HTMLParser(response.content)
2323

24-
# Find all rows that contain filename divs
24+
# Find all divs with class row
2525
rows = tree.css("div.row")
2626

2727
for row in rows:
28-
# Find the filename div in this row
28+
# Find the first div with class fileName inside this row
2929
filename_div = row.css_first("div.fileName")
3030
if not filename_div:
3131
continue

notebooks/experiments/minutes_diarization/process_min_diarization.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ def format_timestamp(seconds: float) -> str:
3939
secs = int(seconds % 60)
4040
return f"{hours:02d}:{minutes:02d}:{secs:02d}"
4141

42-
# Create formatted HTML output
42+
# Copied from John's transcription creator to simplify the diarization. TODO: turn this into a function, or use the VTT output instead.
4343
speaker_lines = ["Meeting Script - Combined by Speaker"]
4444

4545
current_speaker = None
@@ -99,7 +99,7 @@ def match_speakers_with_gemini(minutes_text, diarization):
9999
system_instruction=instruction,
100100
),
101101
)
102-
resp = chat.send_message("Show me all the market entities")
102+
resp = chat.send_message("Show me speaker identification")
103103

104104
result = resp.candidates[0].content.parts[0].text
105105
print(f"result: {result}")

0 commit comments

Comments
 (0)