]*class=["'][^"']*content[^"']*["'][^>]*>([\s\S]*?)<\/div>/i,
+      /
]*class=["'][^"']*post[^"']*["'][^>]*>([\s\S]*?)<\/div>/i,
+      /]*>([\s\S]*?)<\/body>/i,
+    ];
+
+    let rawContent = '';
+    for (const pattern of contentPatterns) {
+      const match = html.match(pattern);
+      if (match?.[1]) {
+        rawContent = match[1];
+        break;
+      }
+    }
+
+    if (!rawContent) {
+      throw new Error('Could not extract content from page');
+    }
+
+    // Clean HTML and extract text
+    let content = rawContent
+      // Remove script and style tags
+      .replace(/