Merge commit 'd803bfe2b1fe7f5e219e50ac20d6801a0a58ac75' as 'vendor/ruvector'

vendor/ruvector/npm/packages/cloud-run/streaming-service-optimized.ts (vendored, new file, 552 lines)

@@ -0,0 +1,552 @@
import Fastify from 'fastify';
import helmet from '@fastify/helmet';
import compress from '@fastify/compress';
import rateLimit from '@fastify/rate-limit';
import websocket from '@fastify/websocket';
import { VectorClient } from './vector-client';
import { LoadBalancer } from './load-balancer';
import { trace, metrics } from '@opentelemetry/api';
import EventEmitter from 'events';
// util/zlib/ioredis are hoisted here so the rest of the file avoids inline require() calls
import Redis from 'ioredis';
import { promisify } from 'util';
import { brotliCompress, brotliDecompress, constants as zlibConstants } from 'zlib';

// ===== ADVANCED OPTIMIZATIONS =====

// 1. ADAPTIVE BATCHING WITH PRIORITY QUEUES
class AdaptiveBatcher extends EventEmitter {
  private queues: Map<string, Array<any>> = new Map();
  private timers: Map<string, NodeJS.Timeout> = new Map();
  private batchSizes: Map<string, number> = new Map();

  // Dynamic batch size bounds and the latency target the tuner aims for
  private readonly MIN_BATCH = 10;
  private readonly MAX_BATCH = 500;
  private readonly TARGET_LATENCY_MS = 5;

  constructor() {
    super();
    // Initialize priority queues
    ['critical', 'high', 'normal', 'low'].forEach(priority => {
      this.queues.set(priority, []);
      this.batchSizes.set(priority, 50);
    });

    // Adaptive tuning every 10 seconds
    setInterval(() => this.tuneParameters(), 10000);
  }

  async add(item: any, priority: string = 'normal'): Promise<any> {
    const queue = this.queues.get(priority) || this.queues.get('normal')!;

    return new Promise((resolve, reject) => {
      // Wrap the query so flush() can read it back via b.query
      queue.push({ query: item, resolve, reject, addedAt: Date.now() });

      const batchSize = this.batchSizes.get(priority) || 50;

      if (queue.length >= batchSize) {
        this.flush(priority);
      } else if (!this.timers.has(priority)) {
        // Dynamic timeout based on queue length
        const timeout = Math.max(1, this.TARGET_LATENCY_MS - queue.length);
        this.timers.set(priority, setTimeout(() => this.flush(priority), timeout));
      }
    });
  }

  private async flush(priority: string) {
    const queue = this.queues.get(priority);
    if (!queue || queue.length === 0) return;

    const timer = this.timers.get(priority);
    if (timer) {
      clearTimeout(timer);
      this.timers.delete(priority);
    }

    const batch = queue.splice(0, this.batchSizes.get(priority) || 50);
    const startTime = Date.now();

    try {
      this.emit('batch', { priority, size: batch.length });
      const results = await this.processBatch(batch.map(b => b.query));

      results.forEach((result: any, i: number) => {
        batch[i].resolve(result);
      });

      // Track latency for adaptive tuning
      const latency = Date.now() - startTime;
      this.emit('latency', { priority, latency, batchSize: batch.length });

    } catch (error) {
      batch.forEach(b => b.reject(error));
    }
  }

  // Protected (not private) so subclasses can plug in a real backend
  protected async processBatch(queries: any[]): Promise<any[]> {
    // Override in subclass
    return queries;
  }

  private tuneParameters() {
    // Adapt batch size to recent queue depth
    this.queues.forEach((queue, priority) => {
      const currentSize = this.batchSizes.get(priority) || 50;
      const queueLength = queue.length;

      let newSize = currentSize;

      if (queueLength > currentSize * 2) {
        // Queue backing up: increase batch size
        newSize = Math.min(this.MAX_BATCH, currentSize * 1.2);
      } else if (queueLength < currentSize * 0.3) {
        // Queue draining quickly: decrease batch size
        newSize = Math.max(this.MIN_BATCH, currentSize * 0.8);
      }

      this.batchSizes.set(priority, Math.round(newSize));
    });
  }
}
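// Usage sketch (illustrative only, never invoked by this service): callers just
// await add(), and the batcher transparently coalesces concurrent requests into
// a single processBatch() call. EchoBatcher is a hypothetical subclass.
class EchoBatcher extends AdaptiveBatcher {
  protected async processBatch(queries: any[]): Promise<any[]> {
    return queries.map(q => ({ echoed: q }));
  }
}

export async function exampleBatcherUsage(): Promise<void> {
  const echo = new EchoBatcher();
  // Ten concurrent adds typically land in one batch via the flush timer
  const results = await Promise.all(
    Array.from({ length: 10 }, (_, i) => echo.add({ id: i }, 'high'))
  );
  console.log(results.length); // 10
}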
// 2. MULTI-LEVEL CACHE WITH COMPRESSION
class CompressedCache {
  private l1: Map<string, any>;
  private l2: any; // Redis
  private compressionThreshold = 1024; // bytes

  constructor(redis: any) {
    this.l1 = new Map();
    this.l2 = redis;

    // Size-based eviction for L1 every minute
    setInterval(() => this.evictL1(), 60000);
  }

  async get(key: string): Promise<any> {
    // Check L1 (in-memory); re-insert to refresh recency so eviction
    // approximates LRU rather than plain FIFO
    if (this.l1.has(key)) {
      const value = this.l1.get(key);
      this.l1.delete(key);
      this.l1.set(key, value);
      return value;
    }

    // Check L2 (Redis); the first byte marks whether the payload was compressed
    const stored = await this.l2.getBuffer(key);
    if (stored) {
      const value = stored[0] === 1
        ? await this.decompress(stored.subarray(1))
        : JSON.parse(stored.subarray(1).toString());
      // Promote to L1
      this.l1.set(key, value);
      return value;
    }

    return null;
  }

  async set(key: string, value: any, ttl: number = 3600): Promise<void> {
    // Set L1
    this.l1.set(key, value);

    // Set L2, compressing large values; prefix a marker byte so get()
    // knows whether to decompress (without it, small uncompressed entries
    // would be fed to brotliDecompress and throw)
    const serialized = JSON.stringify(value);
    const buffer = Buffer.from(serialized);

    if (buffer.length > this.compressionThreshold) {
      const compressed = await this.compress(buffer);
      await this.l2.setex(key, ttl, Buffer.concat([Buffer.from([1]), compressed]));
    } else {
      await this.l2.setex(key, ttl, Buffer.concat([Buffer.from([0]), buffer]));
    }
  }

  private async compress(buffer: Buffer): Promise<Buffer> {
    const compressAsync = promisify(brotliCompress) as (b: Buffer) => Promise<Buffer>;
    return compressAsync(buffer);
  }

  private async decompress(buffer: Buffer): Promise<any> {
    const decompressAsync = promisify(brotliDecompress) as (b: Buffer) => Promise<Buffer>;
    const decompressed = await decompressAsync(buffer);
    return JSON.parse(decompressed.toString());
  }

  private evictL1() {
    // Map preserves insertion order, so with the get()-refresh above the
    // oldest entries are also the least recently used
    if (this.l1.size > 10000) {
      const toDelete = this.l1.size - 8000;
      const keys = Array.from(this.l1.keys()).slice(0, toDelete);
      keys.forEach(k => this.l1.delete(k));
    }
  }
}
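// Usage sketch (illustrative; assumes REDIS_URL points at a reachable Redis
// instance): small values round-trip as plain JSON, large ones are brotli-
// compressed transparently.
export async function exampleCacheUsage(): Promise<void> {
  const cache = new CompressedCache(new Redis(process.env.REDIS_URL || 'redis://localhost:6379'));
  await cache.set('big', { payload: 'x'.repeat(10000) }, 60); // above threshold: compressed
  const hit = await cache.get('big'); // served from L1 here
  console.log(hit.payload.length); // 10000
}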
// 3. CONNECTION POOLING WITH HEALTH CHECKS
class AdvancedConnectionPool {
  private pools: Map<string, any[]> = new Map();
  private healthScores: Map<string, number> = new Map();
  private readonly maxPerPool = 100;
  private readonly minPerPool = 10;

  constructor() {
    // Health check every 30 seconds
    setInterval(() => this.healthCheck(), 30000);
  }

  async acquire(poolId: string): Promise<any> {
    let pool = this.pools.get(poolId);

    if (!pool) {
      pool = [];
      this.pools.set(poolId, pool);
      this.healthScores.set(poolId, 1.0);
    }

    // Try to get a healthy connection; close unhealthy ones instead of leaking them
    let connection = null;
    while (pool.length > 0 && !connection) {
      const candidate = pool.pop();
      if (await this.isHealthy(candidate)) {
        connection = candidate;
      } else {
        await this.closeConnection(candidate);
      }
    }

    // Create new if needed
    if (!connection) {
      connection = await this.createConnection(poolId);
    }

    return connection;
  }

  async release(poolId: string, connection: any): Promise<void> {
    const pool = this.pools.get(poolId);
    if (pool && pool.length < this.maxPerPool) {
      pool.push(connection);
    } else {
      await this.closeConnection(connection);
    }
  }

  private async isHealthy(connection: any): Promise<boolean> {
    try {
      await connection.ping();
      return true;
    } catch {
      return false;
    }
  }

  private async healthCheck() {
    for (const [poolId, pool] of this.pools) {
      // Keep only connections that still respond, and score the pool by the
      // fraction that survived (the original check counted but never pruned)
      const checked = await Promise.all(
        pool.map(async conn => ({ conn, ok: await this.isHealthy(conn) }))
      );
      const survivors = checked.filter(c => c.ok).map(c => c.conn);
      const healthScore = pool.length > 0 ? survivors.length / pool.length : 1.0;

      pool.length = 0;
      pool.push(...survivors);
      this.healthScores.set(poolId, healthScore);

      // Maintain minimum pool size
      while (pool.length < this.minPerPool) {
        pool.push(await this.createConnection(poolId));
      }
    }
  }

  // Protected so subclasses can supply real connections; the default stub
  // exposes ping() so it passes its own health check
  protected async createConnection(poolId: string): Promise<any> {
    // Override in subclass
    return { poolId, id: Math.random(), ping: async () => undefined };
  }

  protected async closeConnection(connection: any): Promise<void> {
    // Override in subclass
  }

  getHealthScore(poolId: string): number {
    return this.healthScores.get(poolId) || 0;
  }
}
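// Usage sketch (hypothetical subclass; the fake connection objects stand in
// for real gRPC/TCP handles): a subclass only needs createConnection,
// closeConnection, and a ping() on the connection object.
class ExamplePool extends AdvancedConnectionPool {
  protected async createConnection(poolId: string): Promise<any> {
    // A real subclass would dial the backend here
    return { poolId, ping: async () => undefined, close: async () => undefined };
  }
  protected async closeConnection(conn: any): Promise<void> {
    await conn.close();
  }
}

export async function examplePoolUsage(): Promise<void> {
  const pool = new ExamplePool();
  const conn = await pool.acquire('primary');
  try {
    // ... use the connection ...
  } finally {
    await pool.release('primary', conn);
  }
}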
// 4. RESULT STREAMING WITH BACKPRESSURE
class StreamingResponder {
  private readonly maxBufferSize = 1000;

  async streamResults(
    query: any,
    processor: AsyncGenerator<any>,
    response: any
  ): Promise<void> {
    response.raw.setHeader('Content-Type', 'application/x-ndjson');
    response.raw.setHeader('Cache-Control', 'no-cache');
    response.raw.setHeader('X-Accel-Buffering', 'no'); // Disable nginx buffering

    let bufferSize = 0;

    for await (const result of processor) {
      // write() returning false signals socket backpressure: pause until drained
      if (!response.raw.write(JSON.stringify(result) + '\n')) {
        await new Promise(resolve => response.raw.once('drain', resolve));
      }

      bufferSize++;

      // Throttle the source if we have emitted too many results too quickly
      if (bufferSize > this.maxBufferSize) {
        await new Promise(resolve => setTimeout(resolve, 10));
        bufferSize = Math.max(0, bufferSize - 100);
      }
    }

    response.raw.end();
  }
}
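// Client-side sketch (illustrative; assumes a runtime with global fetch, e.g.
// Node 18+, and that the service is reachable at baseUrl; the query string is
// a placeholder): NDJSON lines arrive incrementally, so a consumer can act on
// each result before the response completes.
export async function exampleStreamConsumer(baseUrl: string): Promise<void> {
  const res = await fetch(`${baseUrl}/api/query/stream?vector=...&topK=10`);
  const reader = res.body!.getReader();
  const decoder = new TextDecoder();
  let buffered = '';

  while (true) {
    const { done, value } = await reader.read();
    if (done) break;
    buffered += decoder.decode(value, { stream: true });
    const lines = buffered.split('\n');
    buffered = lines.pop()!; // keep the trailing partial line for the next chunk
    for (const line of lines) {
      if (line.trim()) console.log(JSON.parse(line));
    }
  }
}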
// 5. QUERY PLAN CACHE (for complex filters)
class QueryPlanCache {
  private cache: Map<string, any> = new Map();
  private stats: Map<string, { hits: number, avgTime: number }> = new Map();

  getPlan(filter: any): any | null {
    const key = this.getKey(filter);
    const plan = this.cache.get(key);

    if (plan) {
      const stat = this.stats.get(key) || { hits: 0, avgTime: 0 };
      stat.hits++;
      this.stats.set(key, stat);
    }

    return plan ?? null;
  }

  cachePlan(filter: any, plan: any, executionTime: number): void {
    const key = this.getKey(filter);
    this.cache.set(key, plan);

    const stat = this.stats.get(key) || { hits: 0, avgTime: 0 };
    stat.avgTime = (stat.avgTime * stat.hits + executionTime) / (stat.hits + 1);
    this.stats.set(key, stat);

    // Evict least valuable plans
    if (this.cache.size > 1000) {
      this.evictLowValue();
    }
  }

  private getKey(filter: any): string {
    // Canonicalize by sorting keys at every level, so logically identical
    // filters always map to the same cache key. (A JSON.stringify replacer
    // array would whitelist only top-level keys at all nesting levels and
    // cause distinct filters to collide.)
    const canonicalize = (v: any): any => {
      if (Array.isArray(v)) return v.map(canonicalize);
      if (v && typeof v === 'object') {
        return Object.keys(v).sort().reduce((acc: any, k) => {
          acc[k] = canonicalize(v[k]);
          return acc;
        }, {});
      }
      return v;
    };
    return JSON.stringify(canonicalize(filter));
  }

  private evictLowValue() {
    // Calculate value score: hits / avgTime
    const scored = Array.from(this.stats.entries())
      .map(([key, stat]) => ({
        key,
        score: stat.hits / (stat.avgTime + 1)
      }))
      .sort((a, b) => a.score - b.score);

    // Remove bottom 20%
    const toRemove = Math.floor(scored.length * 0.2);
    for (let i = 0; i < toRemove; i++) {
      this.cache.delete(scored[i].key);
      this.stats.delete(scored[i].key);
    }
  }
}
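// Usage sketch (illustrative; the filter and plan objects are made up): the
// first query for a filter shape pays the planning cost and caches the plan;
// later queries with the same filter reuse it regardless of key order.
export function examplePlanCacheUsage(): void {
  const plans = new QueryPlanCache();
  plans.cachePlan({ category: 'docs', lang: 'en' }, { useIndex: 'category_lang' }, 12);
  // Key order differs, but canonicalization yields the same cache key
  const reused = plans.getPlan({ lang: 'en', category: 'docs' });
  console.log(reused); // { useIndex: 'category_lang' }
}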
// 6. OPTIMIZED MAIN SERVICE
const fastify = Fastify({
  logger: true,
  trustProxy: true,
  http2: true,
  requestIdHeader: 'x-request-id',
  requestIdLogLabel: 'reqId',
  disableRequestLogging: true, // Custom logging for better performance
  ignoreTrailingSlash: true,
  maxParamLength: 500,
  bodyLimit: 1048576, // 1MB
  keepAliveTimeout: 65000, // Longer than ALB timeout
  connectionTimeout: 70000,
});
// Register plugins
fastify.register(helmet, {
  contentSecurityPolicy: false,
  global: true,
});

fastify.register(compress, {
  global: true,
  threshold: 1024,
  encodings: ['br', 'gzip', 'deflate'],
  brotliOptions: {
    params: {
      [zlibConstants.BROTLI_PARAM_MODE]: zlibConstants.BROTLI_MODE_TEXT,
      [zlibConstants.BROTLI_PARAM_QUALITY]: 4, // Fast compression
    }
  },
  zlibOptions: {
    level: 6, // Balanced
  }
});

// Redis-based rate limiting for distributed environments
fastify.register(rateLimit, {
  global: true,
  max: 1000,
  timeWindow: '1 minute',
  cache: 10000,
  allowList: ['127.0.0.1'],
  // ioredis exposes a constructor, not createClient()
  redis: process.env.REDIS_URL ? new Redis(process.env.REDIS_URL) : undefined,
  nameSpace: 'ruvector:ratelimit:',
  continueExceeding: true,
  enableDraftSpec: true,
});

fastify.register(websocket, {
  options: {
    maxPayload: 1048576,
    clientTracking: true,
    perMessageDeflate: {
      zlibDeflateOptions: {
        level: 6,
      },
      threshold: 1024,
    }
  }
});
// Initialize optimized components
const vectorClient = new VectorClient({
  host: process.env.RUVECTOR_HOST || 'localhost',
  port: parseInt(process.env.RUVECTOR_PORT || '50051'),
  maxConnections: parseInt(process.env.MAX_CONNECTIONS || '100'),
  minConnections: parseInt(process.env.MIN_CONNECTIONS || '10'),
  enableCache: true,
  cacheTTL: 3600,
});

const loadBalancer = new LoadBalancer({
  backends: (process.env.BACKEND_URLS || '').split(','),
  healthCheckInterval: 30000,
  circuitBreakerThreshold: 5,
  circuitBreakerTimeout: 60000,
});

const queryPlanCache = new QueryPlanCache();
const streamer = new StreamingResponder();

// Adaptive batching wired to the vector backend
class VectorBatcher extends AdaptiveBatcher {
  protected async processBatch(queries: any[]): Promise<any[]> {
    return vectorClient.batchQuery(queries);
  }
}

const vectorBatcher = new VectorBatcher();
// Optimized batch query endpoint with adaptive batching
fastify.post('/api/query/batch', async (request, reply) => {
  const { queries, priority = 'normal' } = request.body as any;

  const results = await Promise.all(
    queries.map((query: any) => vectorBatcher.add(query, priority))
  );

  return { results, count: results.length };
});

// Streaming query with backpressure and plan caching
fastify.get('/api/query/stream', async (request, reply) => {
  const { vector, topK = 10, filters } = request.query as any;

  // Check query plan cache
  const plan = filters ? queryPlanCache.getPlan(filters) : null;

  async function* resultGenerator() {
    const startTime = Date.now();

    for await (const result of vectorClient.streamQuery({ vector, topK, filters, plan })) {
      yield result;
    }

    // Cache the plan once we have a measured execution time
    if (filters && !plan) {
      const executionTime = Date.now() - startTime;
      queryPlanCache.cachePlan(filters, { ...filters, optimized: true }, executionTime);
    }
  }

  await streamer.streamResults({ vector, topK, filters }, resultGenerator(), reply);
});
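// Example requests (illustrative; adjust host/port to your deployment, and the
// vector value is a placeholder). Because the server above is configured with
// http2: true over plaintext (h2c), curl needs --http2-prior-knowledge:
//
//   curl --http2-prior-knowledge -X POST http://localhost:8080/api/query/batch \
//     -H 'Content-Type: application/json' \
//     -d '{"queries":[{"vector":[0.1,0.2],"topK":5}],"priority":"high"}'
//
//   curl --http2-prior-knowledge -N 'http://localhost:8080/api/query/stream?vector=...&topK=10'
//
// The stream endpoint emits NDJSON: one JSON result per line.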
// Health endpoint with detailed status
fastify.get('/health', async (request, reply) => {
  const health = {
    status: 'healthy',
    timestamp: new Date().toISOString(),
    uptime: process.uptime(),
    memory: process.memoryUsage(),
    connections: {
      active: vectorClient.getActiveConnections(),
      poolSize: vectorClient.getPoolSize(),
    },
    cache: {
      hitRate: vectorClient.getCacheHitRate(),
      size: vectorClient.getCacheSize(),
    },
    batcher: {
      queueSizes: {},
    },
    loadBalancer: {
      backends: loadBalancer.getBackendHealth(),
    },
  };

  return health;
});
// Graceful shutdown
const gracefulShutdown = async (signal: string) => {
  console.log(`Received ${signal}, starting graceful shutdown...`);

  // Stop accepting new connections; fastify.close() resolves once in-flight
  // requests finish, so cap the wait at 30 seconds instead of always sleeping
  await Promise.race([
    fastify.close(),
    new Promise(resolve => setTimeout(resolve, 30000)),
  ]);

  // Close backend connections
  await vectorClient.close();

  console.log('Graceful shutdown complete');
  process.exit(0);
};

process.on('SIGTERM', () => gracefulShutdown('SIGTERM'));
process.on('SIGINT', () => gracefulShutdown('SIGINT'));
// Start server
const start = async () => {
  try {
    const port = parseInt(process.env.PORT || '8080');
    const host = process.env.HOST || '0.0.0.0';

    await fastify.listen({ port, host });
    console.log(`Server listening on ${host}:${port}`);
    console.log('Optimizations enabled: adaptive batching, compressed cache, connection pooling');
  } catch (err) {
    fastify.log.error(err);
    process.exit(1);
  }
};

start();

export default fastify;