import React, { useState } from 'react';

export default function Step1Tokenization({ onComplete, onNext }) {
  const [inputText, setInputText] = useState("Hello, GPT-2!");
  const [tokens, setTokens] = useState([]);
  const [quizAnswer, setQuizAnswer] = useState('');
  const [quizFeedback, setQuizFeedback] = useState('');

  // Simplified tokenization for the demo: split on whitespace and common
  // punctuation. Real GPT-2 uses byte-level BPE with learned merges, so the
  // actual token boundaries differ (see the sketch below).
  const tokenize = (text) => {
    // The capture group keeps punctuation as its own token; pure-whitespace
    // matches trim to '' and are dropped by the filter.
    const simpleTokens = text.split(/(\s+|[,.!?])/g).filter(t => t.trim());
    setTokens(simpleTokens);
  };
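
  // For contrast, real GPT-2 tokenization via a BPE library (a sketch, not
  // wired into this demo; assumes a package like "js-tiktoken" that exposes
  // GPT-2's "r50k_base" encoding, and the exact API depends on the library):
  //
  //   import { getEncoding } from 'js-tiktoken';
  //   const enc = getEncoding('r50k_base'); // GPT-2's 50,257-token vocabulary
  //   enc.encode('Hello');                  // -> [15496], matching the example below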

  // Naive keyword check: accept any answer that mentions the key concept
  // ("subword" / "sub-word"). Good enough for a demo, not a real grader.
  const checkQuiz = () => {
    const correct = /sub[- ]?word/.test(quizAnswer.toLowerCase());
    setQuizFeedback(correct
      ? '✓ Correct! BPE breaks text into subword units, allowing the model to handle unknown words.'
      : '✗ Try again. Think about how BPE handles rare or unknown words.'
    );
    if (correct) onComplete();
  };

  return (
    <div className="space-y-8">
      <div>
        <h2 className="text-3xl font-bold mb-2">Step 1: Tokenization & Embeddings</h2>
        <p className="text-gray-400">How text becomes numbers that GPT-2 can understand</p>
      </div>

      {/* Explanation */}
      <div className="bg-gray-800 rounded-lg p-6 space-y-4">
        <h3 className="text-xl font-semibold text-emerald-400">What is Tokenization?</h3>
        <p className="text-gray-300">
          GPT-2 can't process raw text; it needs numbers. <strong>Tokenization</strong> converts text into a sequence of tokens (subword units).
        </p>
        <p className="text-gray-300">
          GPT-2 uses <strong>Byte-Pair Encoding (BPE)</strong> with a vocabulary of 50,257 tokens. This allows it to:
        </p>
        <ul className="list-disc list-inside space-y-1 text-gray-300 ml-4">
          <li>Handle any text (including rare words)</li>
          <li>Break unknown words into known subwords</li>
          <li>Keep common words as single tokens</li>
        </ul>
      </div>
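
      {/*
        Concrete example of the subword idea (a hypothetical split; actual
        boundaries depend on GPT-2's learned merge rules): a rare word such as
        "tokenization" can be encoded as known pieces like "token" + "ization"
        rather than falling back to a single unknown-word token.
      */}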

      {/* Interactive Demo */}
      <div className="bg-gray-800 rounded-lg p-6 space-y-4">
        <h3 className="text-xl font-semibold text-emerald-400">Try it Yourself</h3>
        <div>
          <label className="block text-sm text-gray-400 mb-2">Enter text:</label>
          <input
            type="text"
            value={inputText}
            onChange={(e) => setInputText(e.target.value)}
            className="w-full bg-gray-700 text-white px-4 py-2 rounded border border-gray-600 focus:border-emerald-500 focus:outline-none"
            placeholder="Type anything..."
          />
        </div>
        <button
          onClick={() => tokenize(inputText)}
          className="px-6 py-2 bg-emerald-600 hover:bg-emerald-700 rounded font-semibold transition-colors"
        >
          Tokenize
        </button>

        {tokens.length > 0 && (
          <div className="mt-4">
            <div className="text-sm text-gray-400 mb-2">Tokens ({tokens.length}):</div>
            <div className="flex flex-wrap gap-2">
              {tokens.map((token, i) => (
                <div key={i} className="bg-emerald-900 text-emerald-100 px-3 py-1 rounded text-sm font-mono">
                  {token}
                </div>
              ))}
            </div>
          </div>
        )}
      </div>

      {/* Embedding Explanation */}
      <div className="bg-gray-800 rounded-lg p-6 space-y-4">
        <h3 className="text-xl font-semibold text-emerald-400">Token Embeddings</h3>
        <p className="text-gray-300">
          Each token is converted to a <strong>learned embedding vector</strong> of size 768 (for GPT-2 Small).
        </p>
        <div className="bg-gray-900 p-4 rounded font-mono text-sm text-gray-300">
          Token "Hello" → Token ID: 15496 → Embedding: [0.23, -0.45, 0.12, ..., 0.67] (768 dimensions)
        </div>
        <p className="text-gray-300">
          These embeddings are <strong>learned during training</strong> so that similar tokens have similar vectors.
        </p>
      </div>
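
      {/*
        Minimal sketch of the lookup itself ("wte" follows the naming used in
        the released GPT-2 weights; the numbers mirror the example above):

          wte         -> learned matrix of shape [50257, 768]
          wte[15496]  -> the 768-dim embedding row for token "Hello"

        Embedding lookup is pure row indexing; no arithmetic on the text.
      */}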

      {/* Exercise */}
      <div className="bg-blue-900 bg-opacity-30 border border-blue-700 rounded-lg p-6 space-y-4">
        <h3 className="text-xl font-semibold text-blue-400">📝 Exercise</h3>
        <p className="text-gray-300">
          Why does GPT-2 use Byte-Pair Encoding instead of word-level tokenization?
        </p>
        <textarea
          value={quizAnswer}
          onChange={(e) => setQuizAnswer(e.target.value)}
          className="w-full bg-gray-700 text-white px-4 py-2 rounded border border-gray-600 focus:border-blue-500 focus:outline-none h-24"
          placeholder="Your answer..."
        />
        <button
          onClick={checkQuiz}
          className="px-6 py-2 bg-blue-600 hover:bg-blue-700 rounded font-semibold transition-colors"
        >
          Check Answer
        </button>
        {quizFeedback && (
          <div className={`p-3 rounded ${quizFeedback.startsWith('✓') ? 'bg-green-900 text-green-200' : 'bg-red-900 text-red-200'}`}>
            {quizFeedback}
          </div>
        )}
      </div>

      {/* Navigation */}
      <div className="flex justify-end">
        <button
          onClick={onNext}
          className="px-6 py-3 bg-emerald-600 hover:bg-emerald-700 rounded font-semibold transition-colors"
        >
          Next: Positional Encoding →
        </button>
      </div>
    </div>
  );
}
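
// Usage sketch (hypothetical parent; `markStepDone` and `setActiveStep` are
// illustrative names, not part of this file):
//
//   <Step1Tokenization
//     onComplete={() => markStepDone(1)}
//     onNext={() => setActiveStep(2)}
//   />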