graphprotocol
diff --git a/CLAUDE.md b/ENGINEERING.md
rename from CLAUDE.md
rename to ENGINEERING.md
diff --git a/packages/indexer-agent/src/agent-optimized.ts b/packages/indexer-agent/src/agent-optimized.ts
Lines changed: 72 additions & 79 deletions
diff --git a/packages/indexer-agent/src/performance-config.ts b/packages/indexer-agent/src/performance-config.ts
Lines changed: 85 additions & 0 deletions
@@ -29,39 +29,21 @@ import {
   DeploymentManagementMode,
   SubgraphStatus,
   sequentialTimerMap,
-  // Import new performance utilities
+  // Import performance optimization modules
+  PerformanceManager,
+  PerformanceManagerConfig,
   NetworkDataCache,
   CircuitBreaker,
   AllocationPriorityQueue,
   GraphQLDataLoader,
-  ConcurrentReconciler,
+  ConcurrentProcessor,
 } from '@graphprotocol/indexer-common'
 
 import PQueue from 'p-queue'
 import pMap from 'p-map'
 import zip from 'lodash.zip'
 import { AgentConfigs, NetworkAndOperator } from './types'
-
-// Configuration constants for performance tuning
-const PERFORMANCE_CONFIG = {
-  ALLOCATION_CONCURRENCY: process.env.ALLOCATION_CONCURRENCY
-    ? parseInt(process.env.ALLOCATION_CONCURRENCY, 10)
-    : 20,
-  DEPLOYMENT_CONCURRENCY: process.env.DEPLOYMENT_CONCURRENCY
-    ? parseInt(process.env.DEPLOYMENT_CONCURRENCY, 10)
-    : 15,
-  BATCH_SIZE: process.env.BATCH_SIZE
-    ? parseInt(process.env.BATCH_SIZE, 10)
-    : 10,
-  CACHE_TTL: process.env.CACHE_TTL
-    ? parseInt(process.env.CACHE_TTL, 10)
-    : 30_000,
-  ENABLE_CIRCUIT_BREAKER: process.env.ENABLE_CIRCUIT_BREAKER !== 'false',
-  ENABLE_PRIORITY_QUEUE: process.env.ENABLE_PRIORITY_QUEUE !== 'false',
-  ENABLE_CACHE: process.env.ENABLE_CACHE !== 'false',
-  NETWORK_QUERY_BATCH_SIZE: 50,
-  PARALLEL_NETWORK_QUERIES: true,
-} as const
+import { loadPerformanceConfig, getOptimizedConfig } from './performance-config'
 
 type ActionReconciliationContext = [AllocationDecision[], number, number]
 
@@ -210,14 +192,11 @@ export class Agent {
   deploymentManagement: DeploymentManagementMode
   pollingInterval: number
 
-  // Performance optimization components
-  private cache: NetworkDataCache
-  private circuitBreaker: CircuitBreaker
-  private priorityQueue: AllocationPriorityQueue
-  private dataLoader: Map<string, GraphQLDataLoader>
-  private reconciler: ConcurrentReconciler
-  private deploymentQueue: PQueue
-  private metricsCollector: NodeJS.Timeout | null = null
+  // Performance optimization system
+  private performanceManager: PerformanceManager
+  private performanceConfig: PerformanceManagerConfig
+  private reconciliationQueue: PQueue
+  private isRunning = false
 
   constructor(configs: AgentConfigs) {
     this.logger = configs.logger.child({ component: 'Agent' })
@@ -233,67 +212,81 @@ export class Agent {
     this.deploymentManagement = configs.deploymentManagement
     this.pollingInterval = configs.pollingInterval
 
-    // Initialize performance components
-    this.cache = new NetworkDataCache(this.logger, {
-      ttl: PERFORMANCE_CONFIG.CACHE_TTL,
-      maxSize: 2000,
-      enableMetrics: true,
-    })
-
-    this.circuitBreaker = new CircuitBreaker(this.logger, {
-      failureThreshold: 5,
-      resetTimeout: 60000,
-      halfOpenMaxAttempts: 3,
-    })
-
-    this.priorityQueue = new AllocationPriorityQueue(this.logger)
-
-    this.dataLoader = new Map()
+    // Initialize performance optimization system
+    this.performanceConfig = getOptimizedConfig()
+    this.performanceManager = new PerformanceManager(
+      this.performanceConfig,
+      this.logger,
+    )
 
-    this.reconciler = new ConcurrentReconciler(this.logger, {
-      concurrency: PERFORMANCE_CONFIG.ALLOCATION_CONCURRENCY,
-      batchSize: PERFORMANCE_CONFIG.BATCH_SIZE,
-      enableCircuitBreaker: PERFORMANCE_CONFIG.ENABLE_CIRCUIT_BREAKER,
-      enablePriorityQueue: PERFORMANCE_CONFIG.ENABLE_PRIORITY_QUEUE,
-      enableCache: PERFORMANCE_CONFIG.ENABLE_CACHE,
+    // Initialize reconciliation queue with resource-aware concurrency
+    this.reconciliationQueue = new PQueue({
+      concurrency: this.performanceConfig.allocationConcurrency,
+      intervalCap: this.performanceConfig.batchSize,
+      interval: 1000,
     })
 
-    // Enhanced deployment queue with higher concurrency
-    this.deploymentQueue = new PQueue({
-      concurrency: PERFORMANCE_CONFIG.DEPLOYMENT_CONCURRENCY,
+    this.logger.info('Agent initialized with performance optimizations', {
+      config: {
+        enablePerformanceManager: this.performanceConfig.enablePerformanceManager,
+        allocationConcurrency: this.performanceConfig.allocationConcurrency,
+        enableCache: this.performanceConfig.enableCache,
+        enableCircuitBreaker: this.performanceConfig.enableCircuitBreaker,
+        enablePriorityQueue: this.performanceConfig.enablePriorityQueue,
+      },
     })
-
-    // Start metrics collection
-    this.startMetricsCollection()
   }
 
   async start(): Promise<Agent> {
+    if (this.isRunning) {
+      this.logger.warn('Agent is already running')
+      return this
+    }
+
+    this.logger.info('Starting optimized indexer agent with performance enhancements')
+
     // --------------------------------------------------------------------------------
-    // * Connect to Graph Node
+    // * Initialize Performance Manager
     // --------------------------------------------------------------------------------
-    this.logger.info(`Connect to Graph node(s)`)
-    try {
-      await this.graphNode.connect()
-    } catch {
-      this.logger.critical(
-        `Could not connect to Graph node(s) and query indexing statuses. Exiting. `,
-      )
-      process.exit(1)
+    if (this.performanceConfig.enablePerformanceManager) {
+      await this.performanceManager.initialize()
+      this.logger.info('Performance manager initialized successfully')
+
+      // Warm up critical data if enabled
+      if (this.performanceConfig.performanceManagerWarmupEnabled) {
+        await this.warmupCriticalData()
+      }
     }
-    this.logger.info(`Connected to Graph node(s)`)
 
     // --------------------------------------------------------------------------------
-    // * Initialize DataLoaders for each network
+    // * Connect to Graph Node with circuit breaker protection
     // --------------------------------------------------------------------------------
-    await this.multiNetworks.map(async ({ network }: NetworkAndOperator) => {
-      const networkId = network.specification.networkIdentifier
-      this.dataLoader.set(
-        networkId,
-        new GraphQLDataLoader(this.logger, network.networkSubgraph, networkId, {
-          maxBatchSize: PERFORMANCE_CONFIG.NETWORK_QUERY_BATCH_SIZE,
-        }),
-      )
-    })
+    this.logger.info('Connecting to Graph node(s) with resilience protection')
+    
+    const connectOperation = async () => {
+      await this.graphNode.connect()
+      this.logger.info('Successfully connected to Graph node(s)')
+    }
+
+    if (this.performanceConfig.enablePerformanceManager) {
+      await this.performanceManager.executeOptimized(connectOperation, {
+        componentName: 'graphNode',
+        fallback: () => {
+          this.logger.error('Failed to connect to Graph node with fallback')
+          throw new Error('Graph node connection failed')
+        },
+      })
+    } else {
+      try {
+        await connectOperation()
+      } catch (error) {
+        this.logger.critical(
+          'Could not connect to Graph node(s) and query indexing statuses. Exiting.',
+          { error },
+        )
+        process.exit(1)
+      }
+    }
 
     // --------------------------------------------------------------------------------
     // * Ensure there is a 'global' indexing rule
 
@@ -61,17 +61,30 @@ export interface PerformanceConfig {
   cacheTTL: number
   cacheMaxSize: number
   cacheCleanupInterval: number
+  
+  // Hierarchical cache settings
+  enableCacheHierarchy: boolean
+  l1CacheTTL: number // DataLoader cache
+  l2CacheTTL: number // NetworkDataCache
 
   // Circuit breaker settings
   enableCircuitBreaker: boolean
   circuitBreakerFailureThreshold: number
   circuitBreakerResetTimeout: number
   circuitBreakerHalfOpenMaxAttempts: number
+  
+  // Global circuit breaker settings
+  enableGlobalCircuitBreaker: boolean
+  perServiceCircuitBreakers: boolean
 
   // Priority queue settings
   enablePriorityQueue: boolean
   priorityQueueSignalThreshold: string
   priorityQueueStakeThreshold: string
+  
+  // Intelligent batching settings
+  enableIntelligentBatching: boolean
+  batchPriorityWeighting: boolean
 
   // Network settings
   enableParallelNetworkQueries: boolean
@@ -87,6 +100,10 @@ export interface PerformanceConfig {
   enableMetrics: boolean
   metricsInterval: number
   enableDetailedLogging: boolean
+  
+  // Performance manager settings
+  enablePerformanceManager: boolean
+  performanceManagerWarmupEnabled: boolean
 }
 
 export const DEFAULT_PERFORMANCE_CONFIG: PerformanceConfig = {
@@ -101,6 +118,11 @@ export const DEFAULT_PERFORMANCE_CONFIG: PerformanceConfig = {
   cacheTTL: PERFORMANCE_DEFAULTS.CACHE_TTL,
   cacheMaxSize: PERFORMANCE_DEFAULTS.CACHE_MAX_SIZE,
   cacheCleanupInterval: PERFORMANCE_DEFAULTS.CACHE_CLEANUP_INTERVAL,
+  
+  // Hierarchical cache settings
+  enableCacheHierarchy: true,
+  l1CacheTTL: 5000, // 5 seconds for request-scoped cache
+  l2CacheTTL: PERFORMANCE_DEFAULTS.CACHE_TTL, // 30 seconds for persistent cache
 
   // Circuit breaker settings
   enableCircuitBreaker: true,
@@ -109,13 +131,21 @@ export const DEFAULT_PERFORMANCE_CONFIG: PerformanceConfig = {
   circuitBreakerResetTimeout:
     PERFORMANCE_DEFAULTS.CIRCUIT_BREAKER_RESET_TIMEOUT,
   circuitBreakerHalfOpenMaxAttempts: 3,
+  
+  // Global circuit breaker settings
+  enableGlobalCircuitBreaker: true,
+  perServiceCircuitBreakers: false,
 
   // Priority queue settings
   enablePriorityQueue: true,
   priorityQueueSignalThreshold:
     PERFORMANCE_DEFAULTS.PRIORITY_QUEUE_SIGNAL_THRESHOLD,
   priorityQueueStakeThreshold:
     PERFORMANCE_DEFAULTS.PRIORITY_QUEUE_STAKE_THRESHOLD,
+  
+  // Intelligent batching settings
+  enableIntelligentBatching: true,
+  batchPriorityWeighting: true,
 
   // Network settings
   enableParallelNetworkQueries: true,
@@ -131,6 +161,10 @@ export const DEFAULT_PERFORMANCE_CONFIG: PerformanceConfig = {
   enableMetrics: true,
   metricsInterval: PERFORMANCE_DEFAULTS.METRICS_INTERVAL,
   enableDetailedLogging: false,
+  
+  // Performance manager settings
+  enablePerformanceManager: true,
+  performanceManagerWarmupEnabled: true,
 }
 
 /**
@@ -159,6 +193,18 @@ function applyCacheSettings(config: PerformanceConfig): void {
   config.enableCache = parseEnvBoolean('ENABLE_CACHE', config.enableCache)
   config.cacheTTL = parseEnvInt('CACHE_TTL', config.cacheTTL)
   config.cacheMaxSize = parseEnvInt('CACHE_MAX_SIZE', config.cacheMaxSize)
+  config.cacheCleanupInterval = parseEnvInt(
+    'CACHE_CLEANUP_INTERVAL',
+    config.cacheCleanupInterval,
+  )
+  
+  // Hierarchical cache settings
+  config.enableCacheHierarchy = parseEnvBoolean(
+    'ENABLE_CACHE_HIERARCHY',
+    config.enableCacheHierarchy,
+  )
+  config.l1CacheTTL = parseEnvInt('L1_CACHE_TTL', config.l1CacheTTL)
+  config.l2CacheTTL = parseEnvInt('L2_CACHE_TTL', config.l2CacheTTL)
 }
 
 /**
@@ -177,6 +223,20 @@ function applyCircuitBreakerSettings(config: PerformanceConfig): void {
     'CIRCUIT_BREAKER_RESET_TIMEOUT',
     config.circuitBreakerResetTimeout,
   )
+  config.circuitBreakerHalfOpenMaxAttempts = parseEnvInt(
+    'CIRCUIT_BREAKER_HALF_OPEN_MAX_ATTEMPTS',
+    config.circuitBreakerHalfOpenMaxAttempts,
+  )
+  
+  // Global circuit breaker settings
+  config.enableGlobalCircuitBreaker = parseEnvBoolean(
+    'ENABLE_GLOBAL_CIRCUIT_BREAKER',
+    config.enableGlobalCircuitBreaker,
+  )
+  config.perServiceCircuitBreakers = parseEnvBoolean(
+    'PER_SERVICE_CIRCUIT_BREAKERS',
+    config.perServiceCircuitBreakers,
+  )
 }
 
 /**
@@ -195,6 +255,16 @@ function applyPriorityQueueSettings(config: PerformanceConfig): void {
     'PRIORITY_QUEUE_STAKE_THRESHOLD',
     config.priorityQueueStakeThreshold,
   )
+  
+  // Intelligent batching settings
+  config.enableIntelligentBatching = parseEnvBoolean(
+    'ENABLE_INTELLIGENT_BATCHING',
+    config.enableIntelligentBatching,
+  )
+  config.batchPriorityWeighting = parseEnvBoolean(
+    'BATCH_PRIORITY_WEIGHTING',
+    config.batchPriorityWeighting,
+  )
 }
 
 /**
@@ -245,6 +315,20 @@ function applyMonitoringSettings(config: PerformanceConfig): void {
   )
 }
 
+/**
+ * Apply performance manager settings: refresh the enable and warmup flags on config in place via parseEnvBoolean
+ */
+function applyPerformanceManagerSettings(config: PerformanceConfig): void {
+  config.enablePerformanceManager = parseEnvBoolean(
+    'ENABLE_PERFORMANCE_MANAGER',
+    config.enablePerformanceManager,
+  )
+  config.performanceManagerWarmupEnabled = parseEnvBoolean(
+    'PERFORMANCE_MANAGER_WARMUP_ENABLED',
+    config.performanceManagerWarmupEnabled,
+  )
+}
+
 /**
  * Load performance configuration from environment variables
  */
@@ -258,6 +342,7 @@ export function loadPerformanceConfig(): PerformanceConfig {
   applyNetworkSettings(config)
   applyRetrySettings(config)
   applyMonitoringSettings(config)
+  applyPerformanceManagerSettings(config)
 
   return config
 }