
Commit 0912970

JavaZeroo and claude authored
Optimize memory usage for large file processing (#61)
* perf: optimize large file memory handling - Avoid repeated split() in ValueExtractor by accepting pre-split lines array - Add LTTB (Largest Triangle Three Buckets) downsampling algorithm for chart rendering - Optimize LocalStorage: large files (>500KB) store only metricsData, not raw content - Add parsing status indicator and large file warning in FileList - Add i18n translations for new UI states This should significantly reduce memory usage when handling files with 100k+ lines. * fix: range-aware downsampling for zoom support When zoomed in, filter data to visible range first, then apply LTTB downsampling. This ensures full detail is visible when zoomed in to a specific range (e.g., 100-200 out of 100000 points). * revert: remove downsampling - display all data points User prefers to see all data points without any downsampling. Removed LTTB algorithm and related code. * perf: optimize chart sync with O(1) index lookup Use WeakMap cache for x-value to index mapping, replacing O(n) findIndex with O(1) Map.get() for faster hover synchronization on large datasets. * test: add stress test scripts for large file handling - stress-test.js: Tests ValueExtractor performance with 10K/50K/100K lines - generate-test-file.js: Generates test log files for browser testing * test: add stress test scripts for large file handling - stress-test.js: Tests ValueExtractor performance with 10K/50K/100K/500K/1M lines - generate-test-file.js: Generates test log files for browser testing - Add npm run test:stress script - Update CI to run stress tests on every PR Test results: - 10K lines: 13ms parse time, 14MB memory - 50K lines: 50ms parse time, 30MB memory - 100K lines: 110ms parse time, 66MB memory - 500K lines: 378ms parse time, 284MB memory - 1M lines: 681ms parse time, 606MB memory * chore: increase LARGE_FILE_THRESHOLD from 500KB to 5MB Raise the threshold for triggering large file handling from 500KB to 5MB. This allows more files to benefit from full content persistence in LocalStorage while still protecting against quota issues with very large files. * chore: sync LARGE_FILE_THRESHOLD in stress-test.js to 5MB Keep stress test consistent with App.jsx threshold change. --------- Co-authored-by: Claude <[email protected]>
1 parent 04e722b commit 0912970
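The two perf techniques described in the message above touch ValueExtractor and the chart hover-sync code, whose diffs are not shown in this excerpt. The sketches below illustrate the general idea only; class, function, and field names here (the exact extractByKeyword signature, data[i].x, indexForX) are assumptions rather than the project's actual code, though the { value, line } result shape matches what scripts/stress-test.js reads.

// Sketch 1 (hypothetical): extractByKeyword accepts either a raw string or a
// pre-split array of lines, so one split('\n') can be shared across metrics.
export class ValueExtractor {
  static extractByKeyword(input, keyword) {
    // Reuse a caller-provided lines array instead of re-splitting a multi-MB string per metric
    const lines = Array.isArray(input) ? input : input.split('\n');
    const results = [];
    for (let i = 0; i < lines.length; i++) {
      const idx = lines[i].indexOf(keyword);
      if (idx === -1) continue;
      // parseFloat skips leading whitespace and stops at the next non-numeric character
      const value = parseFloat(lines[i].slice(idx + keyword.length));
      if (!Number.isNaN(value)) results.push({ value, line: i + 1 });
    }
    return results;
  }
}

// Sketch 2 (hypothetical): memoize an x-value -> index Map per dataset in a WeakMap,
// so hover synchronization does an O(1) Map.get() instead of an O(n) findIndex().
const indexCache = new WeakMap();

function indexForX(data, x) {
  let map = indexCache.get(data);
  if (!map) {
    map = new Map();
    for (let i = 0; i < data.length; i++) map.set(data[i].x, i);
    indexCache.set(data, map);
  }
  return map.get(x) ?? -1;
}

Keying the cache on the dataset array itself means that when a dataset is replaced and the old array becomes unreachable, its index Map can be garbage-collected along with it, so no explicit invalidation is needed.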

12 files changed, +330 -56 lines


.github/workflows/ci.yml

Lines changed: 16 additions & 1 deletion
@@ -3,7 +3,7 @@ name: CI
 on:
   pull_request:
   push:
-    branches: [ main ]
+    branches: [ main, master ]

 jobs:
   test:
@@ -15,6 +15,21 @@ jobs:
           node-version: '20'
           cache: 'npm'
       - run: npm install
+      - run: npm run lint
       - run: npm test
         env:
           CI: true
+
+  stress-test:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-node@v4
+        with:
+          node-version: '20'
+          cache: 'npm'
+      - run: npm install
+      - name: Run stress test (10K - 1M lines)
+        run: npm run test:stress
+        env:
+          NODE_OPTIONS: '--max-old-space-size=4096'
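The 4 GB heap cap here (--max-old-space-size=4096) leaves generous headroom over the roughly 606 MB peak that the commit message reports for the 1M-line case, so the stress job should tolerate moderate memory regressions without flaking on CI runners.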

package.json

Lines changed: 2 additions & 1 deletion
@@ -10,7 +10,8 @@
     "build": "vite build",
     "lint": "eslint .",
     "preview": "vite preview",
-    "test": "vitest run --coverage"
+    "test": "vitest run --coverage",
+    "test:stress": "node scripts/stress-test.js"
   },
   "dependencies": {
     "@tailwindcss/forms": "^0.5.10",

public/locales/en/translation.json

Lines changed: 3 additions & 0 deletions
@@ -12,6 +12,9 @@
   "fileList.disabled": "Disabled",
   "fileList.config": "Configure file {{name}}",
   "fileList.delete": "Remove file {{name}}",
+  "fileList.parsing": "Parsing",
+  "fileList.needsReupload": "Large file - re-upload required to re-parse",
+  "fileList.needsReuploadTip": "File data is cached, but re-upload is required to modify parsing config",
   "comparison.title": "Compare Mode",
   "comparison.select": "Select comparison mode",
   "comparison.multiFileMode": "Multi-file comparison mode",

public/locales/zh/translation.json

Lines changed: 3 additions & 0 deletions
@@ -12,6 +12,9 @@
   "fileList.disabled": "已禁用",
   "fileList.config": "配置文件 {{name}}",
   "fileList.delete": "删除文件 {{name}}",
+  "fileList.parsing": "解析中",
+  "fileList.needsReupload": "大文件 - 需要重新上传才能重新解析",
+  "fileList.needsReuploadTip": "此文件数据已缓存,但需要重新上传才能修改解析配置",
   "comparison.title": "对比模式",
   "comparison.select": "选择数据对比模式",
   "comparison.multiFileMode": "多文件对比模式",

scripts/generate-test-file.js

Lines changed: 35 additions & 0 deletions
@@ -0,0 +1,35 @@
+/**
+ * Generate test log file for browser testing
+ * Run with: node scripts/generate-test-file.js [lines]
+ * Example: node scripts/generate-test-file.js 100000
+ */
+
+import fs from 'fs';
+import path from 'path';
+import { fileURLToPath } from 'url';
+
+const __dirname = path.dirname(fileURLToPath(import.meta.url));
+
+const numLines = parseInt(process.argv[2]) || 100000;
+
+console.log(`\n📝 Generating test file with ${numLines.toLocaleString()} lines...`);
+
+const lines = [];
+for (let i = 0; i < numLines; i++) {
+  const step = i;
+  const loss = Math.random() * 2 + Math.exp(-i / 10000);
+  const gradNorm = Math.random() * 0.5 + 0.1;
+  lines.push(`step: ${step} | loss: ${loss.toFixed(6)} | grad_norm: ${gradNorm.toFixed(6)}`);
+}
+
+const content = lines.join('\n');
+const outputPath = path.join(__dirname, `test-${numLines}.log`);
+
+fs.writeFileSync(outputPath, content);
+
+const stats = fs.statSync(outputPath);
+const sizeMB = (stats.size / 1024 / 1024).toFixed(2);
+
+console.log(`✓ Created: ${outputPath}`);
+console.log(`✓ Size: ${sizeMB} MB`);
+console.log(`\n📌 Drag this file into the Log Analyzer to test!`);
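The line count is the script's only argument. For example, node scripts/generate-test-file.js 150000 writes scripts/test-150000.log; at roughly 50 bytes per generated line that is about 7 to 8 MB, just over the new 5 MB threshold, which makes it a convenient fixture for exercising the metricsData-only persistence path in the browser.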

scripts/stress-test.js

Lines changed: 155 additions & 0 deletions
@@ -0,0 +1,155 @@
+/**
+ * Stress test for large file handling
+ * Run with: node scripts/stress-test.js
+ */
+
+import { ValueExtractor } from '../src/utils/ValueExtractor.js';
+
+// Generate a large test log file
+function generateTestLog(numLines) {
+  console.log(`\n📝 Generating ${numLines.toLocaleString()} lines of test data...`);
+  const startTime = Date.now();
+
+  const lines = [];
+  for (let i = 0; i < numLines; i++) {
+    const step = i;
+    const loss = Math.random() * 2 + Math.exp(-i / 10000); // Decreasing loss with noise
+    const gradNorm = Math.random() * 0.5 + 0.1;
+    lines.push(`step: ${step} | loss: ${loss.toFixed(6)} | grad_norm: ${gradNorm.toFixed(6)}`);
+  }
+
+  const content = lines.join('\n');
+  const elapsed = Date.now() - startTime;
+  const sizeBytes = Buffer.byteLength(content, 'utf8');
+  const sizeMB = (sizeBytes / 1024 / 1024).toFixed(2);
+
+  console.log(` ✓ Generated in ${elapsed}ms`);
+  console.log(` ✓ Size: ${sizeMB} MB (${sizeBytes.toLocaleString()} bytes)`);
+
+  return { content, sizeBytes };
+}
+
+// Test ValueExtractor performance
+function testValueExtractor(content) {
+  console.log('\n🔍 Testing ValueExtractor...');
+
+  // Test 1: String input (old way - splits every time)
+  console.log('\n Test 1: extractByKeyword with string input');
+  let start = Date.now();
+  const result1 = ValueExtractor.extractByKeyword(content, 'loss:');
+  let elapsed = Date.now() - start;
+  console.log(` ✓ Found ${result1.length.toLocaleString()} matches in ${elapsed}ms`);
+
+  // Test 2: Pre-split lines (optimized way)
+  console.log('\n Test 2: extractByKeyword with pre-split lines');
+  start = Date.now();
+  const lines = content.split('\n');
+  const splitTime = Date.now() - start;
+  console.log(` ✓ Split into ${lines.length.toLocaleString()} lines in ${splitTime}ms`);
+
+  start = Date.now();
+  const result2 = ValueExtractor.extractByKeyword(lines, 'loss:');
+  elapsed = Date.now() - start;
+  console.log(` ✓ Found ${result2.length.toLocaleString()} matches in ${elapsed}ms`);
+
+  // Test 3: Multiple metrics with pre-split lines
+  console.log('\n Test 3: Multiple metrics with pre-split lines (simulates worker)');
+  start = Date.now();
+  const lossResults = ValueExtractor.extractByKeyword(lines, 'loss:');
+  const gradResults = ValueExtractor.extractByKeyword(lines, 'grad_norm:');
+  elapsed = Date.now() - start;
+  console.log(` ✓ Loss: ${lossResults.length.toLocaleString()} matches`);
+  console.log(` ✓ Grad Norm: ${gradResults.length.toLocaleString()} matches`);
+  console.log(` ✓ Total time: ${elapsed}ms`);
+
+  // Verify data integrity
+  console.log('\n Verifying data integrity...');
+  if (result1.length === result2.length) {
+    console.log(` ✓ Match counts are equal: ${result1.length}`);
+  } else {
+    console.log(` ✗ ERROR: Match counts differ! ${result1.length} vs ${result2.length}`);
+  }
+
+  return { lossResults, gradResults, lines };
+}
+
+// Test memory usage
+function testMemoryUsage(label) {
+  const used = process.memoryUsage();
+  console.log(`\n📊 Memory Usage (${label}):`);
+  console.log(` Heap Used: ${(used.heapUsed / 1024 / 1024).toFixed(2)} MB`);
+  console.log(` Heap Total: ${(used.heapTotal / 1024 / 1024).toFixed(2)} MB`);
+  console.log(` RSS: ${(used.rss / 1024 / 1024).toFixed(2)} MB`);
+  return used;
+}
+
+// Main test runner
+async function runStressTest() {
+  console.log('═'.repeat(60));
+  console.log('🚀 STRESS TEST FOR LARGE FILE HANDLING');
+  console.log('═'.repeat(60));
+
+  const testCases = [
+    { lines: 10000, name: '10K lines' },
+    { lines: 50000, name: '50K lines' },
+    { lines: 100000, name: '100K lines' },
+    { lines: 500000, name: '500K lines' },
+    { lines: 1000000, name: '1M lines' },
+  ];
+
+  testMemoryUsage('Initial');
+
+  for (const testCase of testCases) {
+    console.log('\n' + '─'.repeat(60));
+    console.log(`📋 TEST CASE: ${testCase.name}`);
+    console.log('─'.repeat(60));
+
+    // Generate test data
+    const { content, sizeBytes } = generateTestLog(testCase.lines);
+
+    // Check if this would be considered a "large file"
+    const LARGE_FILE_THRESHOLD = 5 * 1024 * 1024; // 5MB
+    const isLargeFile = sizeBytes > LARGE_FILE_THRESHOLD;
+    console.log(`\n Large file threshold: ${isLargeFile ? '⚠️ EXCEEDS' : '✓ Within'} (${(LARGE_FILE_THRESHOLD / 1024 / 1024).toFixed(0)}MB)`);
+
+    // Test ValueExtractor
+    const { lossResults, gradResults } = testValueExtractor(content);
+
+    // Memory after processing
+    testMemoryUsage('After processing');
+
+    // Summary
+    console.log('\n📈 Results Summary:');
+    console.log(` Lines processed: ${testCase.lines.toLocaleString()}`);
+    console.log(` Loss data points: ${lossResults.length.toLocaleString()}`);
+    console.log(` Grad norm data points: ${gradResults.length.toLocaleString()}`);
+
+    // Verify first and last values
+    if (lossResults.length > 0) {
+      console.log(` First loss value: ${lossResults[0].value.toFixed(6)} (line ${lossResults[0].line})`);
+      console.log(` Last loss value: ${lossResults[lossResults.length - 1].value.toFixed(6)} (line ${lossResults[lossResults.length - 1].line})`);
+    }
+
+    // Force GC if available
+    if (global.gc) {
+      global.gc();
+      console.log('\n 🧹 Garbage collection triggered');
+    }
+  }
+
+  console.log('\n' + '═'.repeat(60));
+  console.log('✅ STRESS TEST COMPLETE');
+  console.log('═'.repeat(60));
+
+  testMemoryUsage('Final');
+}
+
+// Run the test
+runStressTest()
+  .then(() => {
+    process.exit(0);
+  })
+  .catch((error) => {
+    console.error('❌ Stress test failed:', error);
+    process.exit(1);
+  });
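One note on the global.gc() branch above: Node only defines global.gc when the process is started with the --expose-gc flag, so a plain npm run test:stress will skip that branch. Running node --expose-gc scripts/stress-test.js enables the explicit collection between test cases, which makes the reported memory numbers more comparable from one case to the next.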

src/App.jsx

Lines changed: 37 additions & 9 deletions
@@ -11,6 +11,9 @@ import { Header } from './components/Header';
 import { PanelLeftClose, PanelLeftOpen } from 'lucide-react';
 import { mergeFilesWithReplacement } from './utils/mergeFiles.js';

+// Threshold for "large file" - files above this won't have content persisted
+const LARGE_FILE_THRESHOLD = 5 * 1024 * 1024; // 5MB of content
+
 // Default global parsing configuration
 export const DEFAULT_GLOBAL_PARSING_CONFIG = {
   metrics: [
@@ -35,7 +38,22 @@ function App() {
   const { t } = useTranslation();
   const [uploadedFiles, setUploadedFiles] = useState(() => {
     const stored = localStorage.getItem('uploadedFiles');
-    return stored ? JSON.parse(stored) : [];
+    if (!stored) return [];
+    try {
+      const parsed = JSON.parse(stored);
+      // Restore files with proper defaults for large files that have metricsData
+      return parsed.map(file => ({
+        ...file,
+        enabled: file.enabled ?? true,
+        isParsing: false,
+        // For large files, metricsData is already stored; for small files it will be re-parsed
+        metricsData: file.metricsData || {},
+        // Mark large files that need re-upload for re-parsing
+        needsReupload: file.isLargeFile && !file.content
+      }));
+    } catch {
+      return [];
+    }
   });

   // Global parsing configuration state
@@ -118,16 +136,26 @@ function App() {
   useEffect(() => {
     if (savingDisabledRef.current) return;
     try {
-      const serialized = uploadedFiles.map(({ id, name, enabled, content, config }) => ({
-        id,
-        name,
-        enabled,
-        content,
-        config
-      }));
+      // Smart serialization: for large files, only store metricsData (not raw content)
+      // This allows the app to still display charts after refresh, but re-parsing will need re-upload
+      const serialized = uploadedFiles.map(({ id, name, enabled, content, config, metricsData }) => {
+        const isLargeFile = content && content.length > LARGE_FILE_THRESHOLD;
+        return {
+          id,
+          name,
+          enabled,
+          // For large files, don't store content to save memory/storage
+          content: isLargeFile ? null : content,
+          config,
+          // Store metricsData for large files so charts still work after refresh
+          metricsData: isLargeFile ? metricsData : undefined,
+          // Flag to indicate this file needs re-upload for re-parsing
+          isLargeFile
+        };
+      });
       if (serialized.length > 0) {
         const json = JSON.stringify(serialized);
-        // Avoid filling localStorage with very large files
+        // Avoid filling localStorage with very large data
         if (json.length > 5 * 1024 * 1024) {
           savingDisabledRef.current = true;
           console.warn('Uploaded files exceed storage limit; persistence disabled.');
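Worth noting about the persistence path above: the json.length > 5 * 1024 * 1024 guard still applies to the metricsData-only payload, so a log whose extracted points alone serialize to more than roughly 5 MB of JSON will still trip the guard and disable persistence entirely. Stripping raw content widens the range of files that fit under the LocalStorage quota rather than removing the cap.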
