Add dynamic homepage generation with latest 5 blog posts

prabha-git · claude · prabha-git · commit 5d431e62c648 · 2025-10-05T22:29:19.000-05:00
- Created generate_index.py to automatically generate homepage with 5 most recent posts
- Updated GitHub Actions workflow to run generation script before build
- Added PyYAML dependency to requirements-doc.txt
- Homepage now shows post title, date, tags, and excerpt with links

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
diff --git a/.github/workflows/mkdocs.yaml b/.github/workflows/mkdocs.yaml
@@ -26,6 +26,10 @@ jobs:
           python -m pip install --upgrade pip
           pip install -r requirements-doc.txt  # This file should list mkdocs and any other packages.
 
+      - name: Generate Index Page
+        run: |
+          python generate_index.py
+
       - name: Build the MkDocs Site
         run: |
           mkdocs build --verbose  # Build the site.
diff --git a/docs/index.md b/docs/index.md
@@ -1,17 +1,51 @@
 # Prabha Arivalagan
 
-AI Engineer 
+AI Engineer writing about agents, LLMs, and cloud infrastructure
 
-- Email: prabhakaran.mails@gmail.com
+## Recent Writing
 
-- [Github](https://github.com/prabha-git)
+### [Building AI Agents in Google Cloud: Choose the Right Approach for Your Needs](/writing/2025/10/04/agents-in-gcp/)
+**October 04, 2025** • adk, agent-framework
 
-- [Medium Blog](https://medium.com/@prabhakaran_arivalagan) 
+- ADK → Google-developed open-source framework for building complex multi-agent systems with maximum control and modularity - Conversational Agents (Dialogflow CX) → Omnichannel...
 
-- [x / Twitter](https://twitter.com/prabhatweet)
+[Read more →](/writing/2025/10/04/agents-in-gcp/)
+
+### [The Language of Agents - Decoding Messages in LangChain & LangGraph](/writing/2025/05/13/the-language-of-agents/)
+**May 13, 2025** • llm
+
+Ever wondered how apps get AI to chat, follow instructions, or even use tools? A lot of the magic comes down to "messages." Think of them as the notes passed between you, the AI,...
+
+[Read more →](/writing/2025/05/13/the-language-of-agents/)
+
+### [Building Personal Chatbot - Part 2](/writing/2024/08/18/building-obsidian-kb-chatbot/)
+**August 18, 2024** • llm
+
+In our previous post, we explored building a chatbot for Obsidian notes using Langchain and basic Retrieval-Augmented Generation (RAG) techniques. Today, I am sharing the...
 
+[Read more →](/writing/2024/08/18/building-obsidian-kb-chatbot/)
 
+### [Building an Obsidian Knowledge base Chatbot: A Journey of Iteration and Learning](/writing/2024/04/29/building-obsidian-kb-chatbot/)
+**April 29, 2024** • llm, obsidian-kb
 
+As an avid Obsidian user, I've always been fascinated by the potential of leveraging my daily notes as a personal knowledge base. Obsidian has become my go-to tool for taking...
 
+[Read more →](/writing/2024/04/29/building-obsidian-kb-chatbot/)
 
+### [Quantized LLM Models](/writing/2024/04/19/quantized-llm-models/)
+**April 19, 2024** • llm
 
+Large Language Models (LLMs) are known for their vast number of parameters, often reaching billions. For example, open-source models like Llama2 come in sizes of 7B, 13B, and 70B...
+
+[Read more →](/writing/2024/04/19/quantized-llm-models/)
+
+---
+
+[View all posts →](/writing/)
+
+## Contact
+
+- Email: prabhakaran.mails@gmail.com
+- [Github](https://github.com/prabha-git)
+- [Medium Blog](https://medium.com/@prabhakaran_arivalagan)
+- [x / Twitter](https://twitter.com/prabhatweet)
diff --git a/generate_index.py b/generate_index.py
@@ -0,0 +1,170 @@
+#!/usr/bin/env python3
+"""
+Generate index.md with the latest 5 blog posts.
+This script scans all posts in docs/writing/posts/ and creates a homepage
+with the most recent posts including title, date, tags, and excerpt.
+"""
+
+import os
+import glob
+import re
+import yaml
+from datetime import datetime, date
+
+def extract_frontmatter_and_content(file_path):
+    """Extract YAML frontmatter and content from a markdown file."""
+    with open(file_path, 'r', encoding='utf-8') as f:
+        content = f.read()
+
+    # Match frontmatter between --- markers
+    match = re.match(r'^---\s*\n(.*?)\n---\s*\n(.*)', content, re.DOTALL)
+    if not match:
+        return None, content
+
+    frontmatter_text = match.group(1)
+    markdown_content = match.group(2)
+
+    try:
+        frontmatter = yaml.safe_load(frontmatter_text)
+    except yaml.YAMLError:
+        return None, markdown_content
+
+    return frontmatter, markdown_content
+
+def extract_excerpt(content, max_length=200):
+    """Extract an excerpt from markdown content."""
+    # Remove markdown headers
+    content = re.sub(r'^#+\s+.*$', '', content, flags=re.MULTILINE)
+    # Remove markdown links but keep text
+    content = re.sub(r'\[([^\]]+)\]\([^\)]+\)', r'\1', content)
+    # Remove markdown formatting
+    content = re.sub(r'[*_`]', '', content)
+    # Remove extra whitespace
+    content = re.sub(r'\s+', ' ', content).strip()
+
+    # Get first meaningful content
+    if len(content) > max_length:
+        content = content[:max_length].rsplit(' ', 1)[0] + '...'
+
+    return content
+
+def parse_date(date_value):
+    """Parse date from various formats to datetime object."""
+    if isinstance(date_value, datetime):
+        return date_value
+    if isinstance(date_value, date):
+        # Convert date to datetime for consistent handling
+        return datetime.combine(date_value, datetime.min.time())
+    if isinstance(date_value, str):
+        try:
+            return datetime.strptime(date_value, '%Y-%m-%d')
+        except ValueError:
+            pass
+    return None
+
+def format_date(date_obj):
+    """Format datetime object to readable string."""
+    if date_obj:
+        return date_obj.strftime('%B %d, %Y')
+    return ''
+
+def generate_post_url(date_obj, slug):
+    """Generate URL for a blog post based on date and slug."""
+    if date_obj and slug:
+        return f"/writing/{date_obj.year}/{date_obj.month:02d}/{date_obj.day:02d}/{slug}/"
+    return "/writing/"
+
+def generate_index():
+    """Generate the index.md file with the latest 5 blog posts."""
+    posts_dir = 'docs/writing/posts'
+    post_files = glob.glob(f'{posts_dir}/*.md')
+
+    posts = []
+    for file_path in post_files:
+        frontmatter, content = extract_frontmatter_and_content(file_path)
+        if not frontmatter:
+            continue  # Skip posts without frontmatter
+
+        # Skip drafts
+        if frontmatter.get('draft') is True:
+            continue
+
+        # Extract metadata
+        date_obj = parse_date(frontmatter.get('date'))
+        slug = frontmatter.get('slug', '')
+        tags = frontmatter.get('tags', [])
+
+        # Try to get title from content (first # header)
+        title_match = re.search(r'^#\s+(.+)$', content, re.MULTILINE)
+        title = title_match.group(1).strip() if title_match else os.path.basename(file_path).replace('.md', '')
+
+        # Get excerpt
+        excerpt = extract_excerpt(content, max_length=180)
+
+        posts.append({
+            'title': title,
+            'date': date_obj,
+            'slug': slug,
+            'tags': tags,
+            'excerpt': excerpt,
+        })
+
+    # Sort by date (newest first), handling None dates
+    posts.sort(key=lambda x: x['date'] if x['date'] else datetime.min, reverse=True)
+
+    # Take top 5
+    recent_posts = posts[:5]
+
+    # Generate index.md content
+    index_content = """# Prabha Arivalagan
+
+AI Engineer writing about agents, LLMs, and cloud infrastructure
+
+## Recent Writing
+
+"""
+
+    for post in recent_posts:
+        date_str = format_date(post['date'])
+        tags_str = ', '.join(post['tags']) if post['tags'] else ''
+        post_url = generate_post_url(post['date'], post['slug'])
+
+        # Post title (linked)
+        index_content += f"### [{post['title']}]({post_url})\n"
+
+        # Date and tags
+        index_content += f"**{date_str}**"
+        if tags_str:
+            index_content += f" • {tags_str}"
+        index_content += "\n\n"
+
+        # Excerpt
+        if post['excerpt']:
+            index_content += f"{post['excerpt']}\n\n"
+
+        # Read more link
+        index_content += f"[Read more →]({post_url})\n\n"
+
+    # Footer with link to all posts and contact info
+    index_content += """---
+
+[View all posts →](/writing/)
+
+## Contact
+
+- Email: prabhakaran.mails@gmail.com
+- [Github](https://github.com/prabha-git)
+- [Medium Blog](https://medium.com/@prabhakaran_arivalagan)
+- [x / Twitter](https://twitter.com/prabhatweet)
+"""
+
+    # Write to docs/index.md
+    with open('docs/index.md', 'w', encoding='utf-8') as f:
+        f.write(index_content)
+
+    print(f"✅ Generated index.md with {len(recent_posts)} recent posts")
+    for post in recent_posts:
+        print(f"   - {post['title']} ({format_date(post['date'])})")
+
+# Regenerate the homepage only when run as a script, not when imported.
+if __name__ == '__main__':
+    generate_index()
diff --git a/requirements-doc.txt b/requirements-doc.txt
@@ -5,3 +5,4 @@ mkdocstrings-python
 mkdocs-minify-plugin
 mkdocs-rss-plugin
 mkdocs-redirects
+PyYAML