feat: add llms.txt and llms-full.txt

thedaviddias · thedaviddias · commit db396059b258 · 2025-02-18T17:11:30.000-05:00
diff --git a/app/[lang]/llms-full.txt/route.ts b/app/[lang]/llms-full.txt/route.ts
@@ -0,0 +1,146 @@
+import fg from 'fast-glob';
+import matter from 'gray-matter';
+import { NextResponse } from 'next/server';
+import * as fs from 'node:fs/promises';
+import path from 'node:path';
+import { remark } from 'remark';
+import remarkGfm from 'remark-gfm';
+import remarkStringify from 'remark-stringify';
+
+// Next.js route segment config: render this route at request time instead of caching it.
+export const dynamic = 'force-dynamic';
+
+// Regular expressions for cleaning up the content.
+// Each one carries the `g` flag, so `String.replace` removes every occurrence.
+
+// An `import` statement: an optional binding clause (`{ ... }`, `*`, or a single
+// identifier) followed by `from`, then the quoted specifier, an optional `;` and newline.
+const IMPORT_REGEX = /import\s+?(?:(?:{[^}]*}|\*|\w+)\s+from\s+)?['"](.*?)['"];?\n?/g;
+// A tag whose name starts with an uppercase ASCII letter and contains only letters:
+// either the opening/self-closing tag alone, or an open/close pair with no `<` between.
+// NOTE(review): the `\/?>` alternative is tried first and succeeds wherever the paired
+// alternative could begin, so only the opening tag is ever removed; closing tags and
+// the text between them stay in the output. Confirm that this is intended.
+const COMPONENT_USAGE_REGEX = /<[A-Z][a-zA-Z]*(?:\s+[^>]*)?(?:\/?>|>[^<]*<\/[A-Z][a-zA-Z]*>)/g;
+// A Callout/Steps/Tabs/Tab/FileTree element together with its body. The body is
+// `[^<]*`, so an element that contains any nested tag is not matched.
+const NEXTRA_COMPONENT_REGEX = /<(?:Callout|Steps|Tabs|Tab|FileTree)[^>]*>[^<]*<\/(?:Callout|Steps|Tabs|Tab|FileTree)>/g;
+// A `{ ... }` expression, allowing one level of nested braces inside it.
+const MDX_EXPRESSION_REGEX = /{(?:[^{}]|{[^{}]*})*}/g;
+// Targets `export` declarations; the match is lazy and stops at the first `;`,
+// newline, or end of input, so only the first line of a multi-line export is removed.
+const EXPORT_REGEX = /export\s+(?:default\s+)?(?:const|let|var|function|class|interface|type)?\s+[a-zA-Z_$][0-9a-zA-Z_$]*[\s\S]*?(?:;|\n|$)/g;
+
+// Fenced code blocks (``` ... ```). The capture group makes `String.split` keep the
+// fences in its result, at the odd indices.
+const FENCED_CODE_REGEX = /(^[ \t]*```[\s\S]*?^[ \t]*```[ \t]*$)/gm;
+
+/**
+ * Removes MDX-only syntax (imports, exports, JSX components, `{...}` expressions)
+ * from a stretch of prose. Must not be applied to fenced code, where braces and
+ * `import` lines are part of the sample being documented.
+ */
+function stripMdxSyntax(segment: string): string {
+  return segment
+    // Remove imports first
+    .replace(IMPORT_REGEX, '')
+    // Remove exports
+    .replace(EXPORT_REGEX, '')
+    // Remove Nextra components with their content
+    .replace(NEXTRA_COMPONENT_REGEX, '')
+    // Remove other React components
+    .replace(COMPONENT_USAGE_REGEX, '')
+    // Remove JSX comments before generic expressions, so a comment containing
+    // deeper brace nesting is dropped whole rather than partially
+    .replace(/{\s*\/\*[\s\S]*?\*\/\s*}/g, '')
+    // Remove MDX expressions
+    .replace(MDX_EXPRESSION_REGEX, '')
+    // Remove empty braces left behind when the step above peeled nested expressions
+    .replace(/{[\s]*}/g, '')
+    // Remove fragments
+    .replace(/<>[\s\S]*?<\/>/g, '')
+    // Collapse blank-line runs last, after every removal that can create them
+    .replace(/\n{3,}/g, '\n\n');
+}
+
+/**
+ * Converts the body of an MDX document into plain Markdown.
+ *
+ * Prose is stripped of MDX/JSX syntax while fenced code blocks are passed through
+ * untouched; the result is then normalised by remark (GFM + stringify). Inline
+ * code spans are not protected and are still subject to the stripping rules.
+ *
+ * @param content MDX source without front matter.
+ * @returns The remark-formatted Markdown, or the stripped but unformatted text
+ *   if remark fails.
+ */
+async function processContent(content: string): Promise<string> {
+  const cleanContent = content
+    .split(FENCED_CODE_REGEX)
+    // Odd indices are the captured fences; even indices are the prose around them.
+    .map((segment, index) => (index % 2 === 1 ? segment : stripMdxSyntax(segment)))
+    .join('')
+    .trim();
+
+  try {
+    // Simple markdown processing without MDX
+    const file = await remark()
+      .use(remarkGfm)
+      .use(remarkStringify)
+      .process(cleanContent);
+
+    return String(file);
+  } catch (error) {
+    console.error('Error processing content:', error);
+    // Fall back to the same cleaned text rather than a differently-cleaned variant.
+    return cleanContent;
+  }
+}
+
+/** Settings passed to every `processFile` call. */
+interface ProcessFileOptions {
+  /** Base that generated pattern links are resolved against (second argument to `new URL`). */
+  baseUrl: string;
+  /** Locale segment placed first in each generated pattern URL path. */
+  lang: string;
+}
+
+/**
+ * Reads one pattern MDX file and renders it as a Markdown section: a heading that
+ * links to the pattern page, the front-matter description, then the cleaned body.
+ *
+ * @param file Path to the `.mdx` file, as produced by the glob in `GET`.
+ * @param options Base URL and locale used to build the pattern link.
+ * @returns The rendered section, or `null` when the file is marked `draft` or
+ *   `hidden`, or when reading or processing it fails (the error is logged).
+ */
+async function processFile(
+  file: string,
+  options: ProcessFileOptions
+): Promise<string | null> {
+  try {
+    const fileContent = await fs.readFile(file, 'utf8');
+    const { content, data } = matter(fileContent);
+
+    // Skip hidden or draft files before doing any further work
+    if (data.draft || data.hidden) {
+      return null;
+    }
+
+    // Get the filename without extension to use as fallback title
+    const basename = path.basename(file, '.mdx');
+
+    // Extract category from file path: content/<lang>/patterns/<category>/...
+    // fast-glob returns '/'-separated paths on every platform, so splitting on
+    // path.sep ('\\' on Windows) would leave a single segment; accept both.
+    const pathParts = path.dirname(file).split(/[\\/]/);
+    const category = pathParts[3] || 'general';
+
+    // Use filename as title if no title in frontmatter, and convert to Title Case
+    const title = data.title || basename.split('-')
+      .map(word => word.charAt(0).toUpperCase() + word.slice(1))
+      .join(' ');
+
+    const processed = await processContent(content);
+    const patternUrl = new URL(
+      `/${options.lang}/patterns/${category}/${basename}`,
+      options.baseUrl
+    ).toString();
+
+    return `# ${category.toUpperCase()}: [${title}](${patternUrl})
+
+${data.description || ''}
+
+${processed}`;
+  } catch (error) {
+    console.error(`Error processing file ${file}:`, error);
+    return null;
+  }
+}
+
+/**
+ * GET handler for `/[lang]/llms-full.txt`: concatenates every published pattern
+ * document into one plain-text response.
+ *
+ * Responds with:
+ * - 200 `text/plain` containing all rendered sections separated by blank lines;
+ * - 404 JSON when no section could be produced;
+ * - 500 JSON when no base URL can be determined or an unexpected error occurs.
+ *
+ * @param _request Unused.
+ * @param context Route context; `params.lang` is the locale used in generated links.
+ */
+export async function GET(
+  _request: Request,
+  { params }: { params: { lang: string } | Promise<{ lang: string }> }
+) {
+  try {
+    // `await` passes a plain object through unchanged, so this works whether the
+    // framework supplies params directly or as a promise.
+    const { lang } = await params;
+
+    let baseUrl = '';
+    if (process.env.NEXT_PUBLIC_VERCEL_URL) {
+      baseUrl = `https://${process.env.NEXT_PUBLIC_VERCEL_URL}`;
+    } else if (process.env.NODE_ENV === 'development') {
+      baseUrl = 'http://localhost:3000';
+    }
+
+    if (!baseUrl) {
+      return NextResponse.json({ error: 'Base URL not configured' }, { status: 500 });
+    }
+
+    // Get files and process them. Content is always read from the `en` tree;
+    // `lang` only affects the links that are generated.
+    const files = await fg(['content/en/patterns/**/*.mdx']);
+    const options: ProcessFileOptions = { baseUrl, lang };
+
+    const scanned = (await Promise.all(
+      files.map(file => processFile(file, options))
+    )).filter(Boolean);
+
+    if (!scanned.length) {
+      return NextResponse.json({ error: 'No content found' }, { status: 404 });
+    }
+
+    return new Response(scanned.join('\n\n'), {
+      headers: {
+        // Declare the encoding so non-ASCII text is not mis-decoded by clients.
+        'Content-Type': 'text/plain; charset=utf-8',
+      },
+    });
+  } catch (error) {
+    console.error('Error generating LLM content:', error);
+    return NextResponse.json({ error: 'Internal Server Error' }, { status: 500 });
+  }
+}
diff --git a/app/[lang]/llms.txt/route.ts b/app/[lang]/llms.txt/route.ts
@@ -1,112 +1,117 @@
-import fg from 'fast-glob';
 import matter from 'gray-matter';
-import * as fs from 'node:fs/promises';
+import { NextResponse } from 'next/server';
+import fs from 'node:fs';
 import path from 'node:path';
-import { remark } from 'remark';
-import remarkGfm from 'remark-gfm';
-import remarkStringify from 'remark-stringify';
 
-export const revalidate = false;
+// Location of the `content/en/patterns` tree, resolved against the process working directory.
+const contentDirectory = path.join(process.cwd(), 'content/en/patterns');
 
-// Regular expressions for cleaning up the content
-const IMPORT_REGEX = /import\s+?(?:(?:{[^}]*}|\*|\w+)\s+from\s+)?['"](.*?)['"];?\n?/g;
-const COMPONENT_USAGE_REGEX = /<[A-Z][a-zA-Z]*(?:\s+[^>]*)?(?:\/?>|>[^<]*<\/[A-Z][a-zA-Z]*>)/g;
-const NEXTRA_COMPONENT_REGEX = /<(?:Callout|Steps|Tabs|Tab|FileTree)[^>]*>[^<]*<\/(?:Callout|Steps|Tabs|Tab|FileTree)>/g;
-const MDX_EXPRESSION_REGEX = /{(?:[^{}]|{[^{}]*})*}/g;
-const EXPORT_REGEX = /export\s+(?:default\s+)?(?:const|let|var|function|class|interface|type)?\s+[a-zA-Z_$][0-9a-zA-Z_$]*[\s\S]*?(?:;|\n|$)/g;
+/** Summary of one pattern document, built from its front matter and file name. */
+interface Pattern {
+  /** Name of the directory under the patterns root that contains the file. */
+  category: string;
+  /** Front-matter `title`, or the slug when no title is set. */
+  title: string;
+  /** Front-matter `summary`, or an empty string. */
+  summary: string;
+  /** Front-matter `status`, or `'coming soon'` when absent. */
+  status: string;
+  /** File name with `.mdx` removed; used as the last URL segment. */
+  slug: string;
+}
 
-export async function GET() {
-  try {
-    const files = await fg(['content/en/patterns/**/*.mdx']);
-
-    const scan = files.map(async (file) => {
-      try {
-        const fileContent = await fs.readFile(file);
-        const { content, data } = matter(fileContent.toString());
-
-        // Get the filename without extension to use as fallback title
-        const basename = path.basename(file, '.mdx');
-
-        // Extract category from file path
-        const pathParts = path.dirname(file).split(path.sep);
-        let category = 'general';
-        if (pathParts.length > 3 && pathParts[3]) {
-          category = pathParts[3];
-        }
-
-        // Skip if the file is marked as hidden or draft
-        if (data.draft || data.hidden) {
-          return null;
-        }
-
-        // Use filename as title if no title in frontmatter, and convert to Title Case
-        const title = data.title || basename.split('-')
-          .map(word => word.charAt(0).toUpperCase() + word.slice(1))
-          .join(' ');
-
-        const processed = await processContent(content);
-        return `File: ${file}
-# ${category.toUpperCase()}: ${title}
-
-${data.description || ''}
-
-${processed}`;
-      } catch (error) {
-        console.error(`Error processing file ${file}:`, error);
-        return null;
-      }
-    });
+/** Patterns grouped by category directory name. */
+interface PatternsByCategory {
+  [category: string]: Pattern[];
+}
 
-    const scanned = (await Promise.all(scan)).filter(Boolean);
+/**
+ * Builds a URL-friendly slug: lower-cases `text`, replaces each run of characters
+ * outside `a-z`/`0-9` with a single hyphen, and drops a hyphen at either end.
+ */
+function slugify(text: string): string {
+  const lowered = text.toLowerCase();
+  const hyphenated = lowered.replace(/[^a-z0-9]+/g, '-');
+  const trimmed = hyphenated.replace(/(^-|-$)/g, '');
+  return trimmed;
+}
 
-    if (!scanned.length) {
-      return new Response('No content found', { status: 404 });
-    }
+/**
+ * Scans the patterns root and collects front-matter metadata for every `.mdx`
+ * file found directly inside each category directory (sub-directories of a
+ * category are not descended into).
+ *
+ * All file-system access is synchronous. No filtering on `draft`/`hidden`
+ * front matter happens here.
+ *
+ * @returns A map from category directory name to the patterns it contains.
+ */
+function getAllPatterns(): PatternsByCategory {
+  // List every entry under the patterns root; non-directories are skipped below
+  const categories = fs.readdirSync(contentDirectory);
 
-    return new Response(scanned.join('\n\n'));
-  } catch (error) {
-    console.error('Error generating LLM content:', error);
-    return new Response('Internal Server Error', { status: 500 });
+  const allPatterns: PatternsByCategory = {};
+
+  for (const category of categories) {
+    const categoryPath = path.join(contentDirectory, category);
+
+    // Skip if not a directory
+    if (!fs.statSync(categoryPath).isDirectory()) continue;
+
+    // Read all MDX files in the category
+    const files = fs.readdirSync(categoryPath)
+      .filter(file => file.endsWith('.mdx'));
+
+    const categoryPatterns = files.map(file => {
+      const fullPath = path.join(categoryPath, file);
+      const fileContents = fs.readFileSync(fullPath, 'utf8');
+      const { data } = matter(fileContents);
+      // String replace removes only the first `.mdx` occurrence in the name
+      const slug = file.replace('.mdx', '');
+
+      return {
+        category,
+        title: data.title || slug,
+        summary: data.summary || '',
+        status: data.status || 'coming soon',
+        slug
+      };
+    });
+
+    allPatterns[category] = categoryPatterns;
   }
+
+  return allPatterns;
 }
 
-async function processContent(content: string): Promise<string> {
+/**
+ * GET handler for `/[lang]/llms.txt`: returns a plain-text index of all patterns,
+ * grouped by category, with a link, optional summary and status for each one,
+ * followed by fixed "Additional Resources" and "Technical Implementation" sections.
+ *
+ * Responds with 200 `text/plain` on success, or 500 JSON if anything throws.
+ *
+ * NOTE(review): `request` is not referenced anywhere in the body.
+ */
+export async function GET(
+  request: Request,
+  { params }: { params: { lang: string } }
+) {
   try {
-    // Multi-step cleanup to handle different MDX constructs
-    let cleanContent = content
-      // Remove imports first
-      .replace(IMPORT_REGEX, '')
-      // Remove exports
-      .replace(EXPORT_REGEX, '')
-      // Remove Nextra components with their content
-      .replace(NEXTRA_COMPONENT_REGEX, '')
-      // Remove other React components
-      .replace(COMPONENT_USAGE_REGEX, '')
-      // Remove MDX expressions
-      .replace(MDX_EXPRESSION_REGEX, '')
-      // Clean up multiple newlines
-      .replace(/\n{3,}/g, '\n\n')
-      // Remove empty JSX expressions
-      .replace(/{[\s]*}/g, '')
-      // Clean up any remaining JSX-like syntax
-      .replace(/<>[\s\S]*?<\/>/g, '')
-      .replace(/{\s*\/\*[\s\S]*?\*\/\s*}/g, '')
-      .trim();
-
-    // Simple markdown processing without MDX
-    const file = await remark()
-      .use(remarkGfm)
-      .use(remarkStringify)
-      .process(cleanContent);
-
-    return String(file);
+    const patterns = getAllPatterns();
+
+    // Get base URL and await params
+    // NOTE(review): outside development, an unset NEXT_PUBLIC_VERCEL_URL yields
+    // `https://localhost:3000`; confirm that this fallback is intended.
+    const [baseUrl, { lang }] = await Promise.all([
+      Promise.resolve(
+        process.env.NODE_ENV === 'development'
+          ? 'http://localhost:3000'
+          : `https://${process.env.NEXT_PUBLIC_VERCEL_URL || 'localhost:3000'}`
+      ),
+      params
+    ]);
+
+    // Generate the text content
+    let content = `# UX Patterns for Developers
+
+## Overview
+This is an automatically generated overview of all UX patterns documented in this project.
+
+## Pattern Categories\n`;
+
+    // Add patterns by category; each heading is the directory name with its first letter upper-cased
+    for (const [category, categoryPatterns] of Object.entries(patterns)) {
+      content += `\n### ${category.charAt(0).toUpperCase() + category.slice(1)}\n`;
+      for (const pattern of categoryPatterns) {
+        const patternUrl = `${baseUrl}/${lang}/patterns/${category}/${pattern.slug}`;
+        content += `- [${pattern.title}](${patternUrl})${pattern.summary ? `: ${pattern.summary}` : ''} [${pattern.status}]\n`;
+      }
+    }
+
+    content += `\n## Additional Resources
+- [Blog posts and articles about UX patterns](${baseUrl}/${lang}/blog)
+- [Comprehensive glossary of UX terms](${baseUrl}/${lang}/glossary)
+
+## Technical Implementation
+- Built with Next.js and TypeScript
+- MDX-based pattern documentation
+- Accessibility-first approach
+- Comprehensive testing guidelines`;
+
+    return new NextResponse(content, {
+      headers: {
+        'Content-Type': 'text/plain',
+      },
+    });
   } catch (error) {
-    console.error('Error processing content:', error);
-    // If processing fails, return a basic cleaned version
-    return content
-      .replace(IMPORT_REGEX, '')
-      .replace(COMPONENT_USAGE_REGEX, '')
-      .replace(MDX_EXPRESSION_REGEX, '')
-      .trim();
+    console.error('Error generating content:', error);
+    return NextResponse.json({ error: 'Internal Server Error' }, { status: 500 });
   }
 }
diff --git a/app/_constants/footer.ts b/app/_constants/footer.ts
@@ -11,12 +11,20 @@ export const FOOTER_MENU_LINKS = (lang: string) => [
     path: `/${lang}/blog`,
     label: 'Blog'
   },
+  {
+    path: `/${lang}/llms.txt`,
+    label: 'LLMs'
+  },
+  {
+    path: `/${lang}/llms-full.txt`,
+    label: 'LLMs Full'
+  },
   {
     path: `/${lang}/about`,
     label: 'About'
   },
   {
     path: `/${lang}/privacy-policy`,
     label: 'Privacy Policy'
-  },
+  }
 ]
diff --git a/middleware.ts b/middleware.ts
@@ -3,6 +3,6 @@ export { middleware } from 'nextra/locales'
 export const config = {
   // Matcher ignoring `/_next/` and `/api/`
+  // The negative lookahead sits directly after the leading `/`, so a path is skipped
+  // only when it begins with one of the listed prefixes. The dots are unescaped and
+  // therefore match any character.
   matcher: [
-    '/((?!api/mdx|api/email|api/patterns/random|api/og|_next/static|_next/image|llms.txt|favicon.ico|robots.txt|og/opengraph-image.png|covers|twitter-image|sitemap.xml|6ba7b811-9dad-11d1-80b4.txt|43mg4ybv6sxxanu24g7dngawd9up5w93.txt|apple-icon.png|manifest|_pagefind|examples).*)'
+    '/((?!api/mdx|api/email|api/patterns/random|api/og|_next/static|_next/image|llms-full.txt|llms.txt|favicon.ico|robots.txt|og/opengraph-image.png|covers|twitter-image|sitemap.xml|6ba7b811-9dad-11d1-80b4.txt|43mg4ybv6sxxanu24g7dngawd9up5w93.txt|apple-icon.png|manifest|_pagefind|examples).*)'
   ]
 }
diff --git a/next.config.ts b/next.config.ts

Original file line number	Diff line number	Diff line change
`@@ -3,6 +3,6 @@ export { middleware } from 'nextra/locales'`
`3`	`3`	`export const config = {`
`4`	`4`	// Matcher ignoring `/_next/` and `/api/`
`5`	`5`	`matcher: [`
`6`		`- '/((?!api/mdx\|api/email\|api/patterns/random\|api/og\|_next/static\|_next/image\|llms.txt\|favicon.ico\|robots.txt\|og/opengraph-image.png\|covers\|twitter-image\|sitemap.xml\|6ba7b811-9dad-11d1-80b4.txt\|43mg4ybv6sxxanu24g7dngawd9up5w93.txt\|apple-icon.png\|manifest\|_pagefind\|examples).*)'`
	`6`	`+ '/((?!api/mdx\|api/email\|api/patterns/random\|api/og\|_next/static\|_next/image\|llms-full.txt\|llms.txt\|favicon.ico\|robots.txt\|og/opengraph-image.png\|covers\|twitter-image\|sitemap.xml\|6ba7b811-9dad-11d1-80b4.txt\|43mg4ybv6sxxanu24g7dngawd9up5w93.txt\|apple-icon.png\|manifest\|_pagefind\|examples).*)'`
`7`	`7`	`]`
`8`	`8`	`}`