codeforboston · Mephistic · Apr 22, 2025 · Mar 26, 2025 · Mar 27, 2025 · Apr 5, 2025
@@ -158,20 +158,6 @@ class HearingScraper extends EventScraper<HearingListItem, Hearing> {
     const hearing = Hearing.check(eventData)
 const content = HearingContent.check(await api.getHearing(EventId)) 
 const content = HearingContent.check(await api.getHearing(EventId)) 
     const shouldScrape = withinCutoff(hearing.startsAt.toDate())
 
-    let payload: Hearing = {
-      id: `hearing-${EventId}`,
-      type: "hearing",
-      content,
-      ...this.timestamps(content)
-    }
-    if (hearing) {
-      payload = {
-        ...payload,
-        videoURL: hearing.videoURL,
-        videoFetchedAt: hearing.videoFetchedAt,
-        videoAssemblyId: hearing.videoAssemblyId
-      }
-    }
     let maybeVideoURL = null
     let transcript = null
 
@@ -191,25 +177,32 @@ class HearingScraper extends EventScraper<HearingListItem, Hearing> {
             maybeVideoURL = firstVideoSource.src
 
             transcript = await assembly.transcripts.submit({
+              audio:
+                // test with: "https://assemblyaiusercontent.com/playground/aKUqpEtmYmI.flac",
+                firstVideoSource.src,
               webhook_url:
+                // test with: "https://ngrokid.ngrok-free.app/demo-dtp/us-central1/transcription",
                 process.env.NODE_ENV === "development"
                   ? "https://us-central1-digital-testimony-dev.cloudfunctions.net/transcription"
                   : "https://us-central1-digital-testimony-prod.cloudfunctions.net/transcription",
-              webhook_auth_header_name: "X-Maple-Webhook",
-              webhook_auth_header_value: newToken,
-              audio: firstVideoSource.src,
-              auto_highlights: true,
-              custom_topics: true,
-              entity_detection: true,
-              iab_categories: false,
-              format_text: true,
-              punctuate: true,
               speaker_labels: true,
-              summarization: true,
-              summary_model: "informative",
-              summary_type: "bullets"
+              webhook_auth_header_name: "x-maple-webhook",
+              webhook_auth_header_value: newToken
             })
 
+            await db
+              .collection("events")
+              .doc(`hearing-${String(EventId)}`)
+              .set({
+                id: `hearing-${EventId}`,
+                type: "hearing",
+                content,
+                ...this.timestamps(content),
+                videoURL: maybeVideoURL,
+                videoFetchedAt: Timestamp.now(),
+                videoAssemblyId: transcript.id
+              })
+
             await db
               .collection("events")
               .doc(`hearing-${String(EventId)}`)
@@ -218,20 +211,17 @@ class HearingScraper extends EventScraper<HearingListItem, Hearing> {
               .set({
                 videoAssemblyWebhookToken: sha256(newToken)
               })
-
-            payload = {
-              ...payload,
-              videoURL: maybeVideoURL,
-              videoFetchedAt: Timestamp.now(),
-              videoAssemblyId: transcript.id
-            }
           }
         }
       }
     }
 
-    const event: Hearing = payload
-    return event
+    return {
+      id: `hearing-${EventId}`,
+      type: "hearing",
+      content,
+      ...this.timestamps(content)
+    } as Hearing
   }
 }
 

@@ -8,23 +8,23 @@ const assembly = new AssemblyAI({
 })
 
 export const transcription = functions.https.onRequest(async (req, res) => {
-  if (
-    req.headers["X-Maple-Webhook"] &&
-    req.headers["webhook_auth_header_value"]
-  ) {
+  console.log("req.headers", req.headers)
+  if (req.headers["x-maple-webhook"]) {
+    console.log("req.body.status", req.body.status)
+
     if (req.body.status === "completed") {
       const transcript = await assembly.transcripts.get(req.body.transcript_id)
+      console.log("transcript.webhook_auth", transcript.webhook_auth)
       if (transcript && transcript.webhook_auth) {
         const maybeEventInDb = await db
           .collection("events")
           .where("videoAssemblyId", "==", transcript.id)
           .get()
+        console.log("maybeEventInDb.docs.length", maybeEventInDb.docs.length)
         if (maybeEventInDb.docs.length) {
           const authenticatedEventsInDb = maybeEventInDb.docs.filter(
             async e => {
-              const hashedToken = sha256(
-                String(req.headers["webhook_auth_header_value"])
-              )
+              const hashedToken = sha256(String(req.headers["x-maple-webhook"]))
 
               const tokenInDb = await db
                 .collection("events")
@@ -33,12 +33,16 @@ export const transcription = functions.https.onRequest(async (req, res) => {
                 .doc("webhookAuth")
                 .get()
               const tokenInDbData = tokenInDb.data()
+              console.log("tokenInDbData", tokenInDbData)
+
               if (tokenInDbData) {
                 return hashedToken === tokenInDbData.videoAssemblyWebhookToken
               }
               return false
             }
           )
+          console.log("authenticatedEventsInDb", authenticatedEventsInDb)
+
           if (authenticatedEventsInDb) {
             try {
               await db
@@ -48,7 +52,7 @@ export const transcription = functions.https.onRequest(async (req, res) => {
 
               authenticatedEventsInDb.forEach(async d => {
                 await d.ref.update({
-                  ["webhook_auth_header_value"]: null
+                  ["x-maple-webhook"]: null
                 })
               })
               console.log("transcript saved in db")