Merge commit 'd803bfe2b1fe7f5e219e50ac20d6801a0a58ac75' as 'vendor/ruvector'

2026-02-28 14:39:40 -05:00
parent 7885bf6278 d803bfe2b1
commit cd5943df23
7854 changed files with 3522914 additions and 0 deletions
--- a/vendor/ruvector/npm/packages/cloud-run/streaming-service-optimized.js
+++ b/vendor/ruvector/npm/packages/cloud-run/streaming-service-optimized.js
@@ -0,0 +1,465 @@
+"use strict";
+// Module interop helper: returns `mod` unchanged when it is flagged with `__esModule`,
+// otherwise wraps it as `{ default: mod }` so call sites can always read `.default`.
+// An already-defined `this.__importDefault` is reused instead of redefining the helper.
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+const fastify_1 = __importDefault(require("fastify"));
+const helmet_1 = __importDefault(require("@fastify/helmet"));
+const compress_1 = __importDefault(require("@fastify/compress"));
+const rate_limit_1 = __importDefault(require("@fastify/rate-limit"));
+const websocket_1 = __importDefault(require("@fastify/websocket"));
+const vector_client_1 = require("./vector-client");
+const load_balancer_1 = require("./load-balancer");
+const events_1 = __importDefault(require("events"));
+// ===== ADVANCED OPTIMIZATIONS =====
+// 1. ADAPTIVE BATCHING WITH PRIORITY QUEUES
+class AdaptiveBatcher extends events_1.default {
+    constructor() {
+        super();
+        this.queues = new Map();
+        this.timers = new Map();
+        this.batchSizes = new Map();
+        // Dynamic batch size based on load
+        this.MIN_BATCH = 10;
+        this.MAX_BATCH = 500;
+        this.TARGET_LATENCY_MS = 5;
+        // Initialize priority queues
+        ['critical', 'high', 'normal', 'low'].forEach(priority => {
+            this.queues.set(priority, []);
+            this.batchSizes.set(priority, 50);
+        });
+        // Adaptive tuning every 10 seconds
+        setInterval(() => this.tuneParameters(), 10000);
+    }
+    async add(item, priority = 'normal') {
+        const queue = this.queues.get(priority) || this.queues.get('normal');
+        return new Promise((resolve, reject) => {
+            queue.push({ ...item, resolve, reject, addedAt: Date.now() });
+            const batchSize = this.batchSizes.get(priority) || 50;
+            if (queue.length >= batchSize) {
+                this.flush(priority);
+            }
+            else if (!this.timers.has(priority)) {
+                // Dynamic timeout based on queue length
+                const timeout = Math.max(1, this.TARGET_LATENCY_MS - queue.length);
+                this.timers.set(priority, setTimeout(() => this.flush(priority), timeout));
+            }
+        });
+    }
+    async flush(priority) {
+        const queue = this.queues.get(priority);
+        if (!queue || queue.length === 0)
+            return;
+        const timer = this.timers.get(priority);
+        if (timer) {
+            clearTimeout(timer);
+            this.timers.delete(priority);
+        }
+        const batch = queue.splice(0, this.batchSizes.get(priority) || 50);
+        const startTime = Date.now();
+        try {
+            this.emit('batch', { priority, size: batch.length });
+            const results = await this.processBatch(batch.map(b => b.query));
+            results.forEach((result, i) => {
+                batch[i].resolve(result);
+            });
+            // Track latency for adaptive tuning
+            const latency = Date.now() - startTime;
+            this.emit('latency', { priority, latency, batchSize: batch.length });
+        }
+        catch (error) {
+            batch.forEach(b => b.reject(error));
+        }
+    }
+    async processBatch(queries) {
+        // Override in subclass
+        return queries;
+    }
+    tuneParameters() {
+        // Adaptive batch size based on recent performance
+        this.queues.forEach((queue, priority) => {
+            const currentSize = this.batchSizes.get(priority) || 50;
+            const queueLength = queue.length;
+            let newSize = currentSize;
+            if (queueLength > currentSize * 2) {
+                // Queue backing up, increase batch size
+                newSize = Math.min(this.MAX_BATCH, currentSize * 1.2);
+            }
+            else if (queueLength < currentSize * 0.3) {
+                // Queue empty, decrease batch size
+                newSize = Math.max(this.MIN_BATCH, currentSize * 0.8);
+            }
+            this.batchSizes.set(priority, Math.round(newSize));
+        });
+    }
+}
+// 2. MULTI-LEVEL CACHE WITH COMPRESSION
+class CompressedCache {
+    constructor(redis) {
+        this.compressionThreshold = 1024; // bytes
+        this.l1 = new Map();
+        this.l2 = redis;
+        // LRU eviction for L1 every minute
+        setInterval(() => this.evictL1(), 60000);
+    }
+    async get(key) {
+        // Check L1 (in-memory)
+        if (this.l1.has(key)) {
+            return this.l1.get(key);
+        }
+        // Check L2 (Redis)
+        const compressed = await this.l2.getBuffer(key);
+        if (compressed) {
+            const value = await this.decompress(compressed);
+            // Promote to L1
+            this.l1.set(key, value);
+            return value;
+        }
+        return null;
+    }
+    async set(key, value, ttl = 3600) {
+        // Set L1
+        this.l1.set(key, value);
+        // Set L2 with compression for large values
+        const serialized = JSON.stringify(value);
+        const buffer = Buffer.from(serialized);
+        if (buffer.length > this.compressionThreshold) {
+            const compressed = await this.compress(buffer);
+            await this.l2.setex(key, ttl, compressed);
+        }
+        else {
+            await this.l2.setex(key, ttl, serialized);
+        }
+    }
+    async compress(buffer) {
+        const { promisify } = require('util');
+        const { brotliCompress } = require('zlib');
+        const compress = promisify(brotliCompress);
+        return compress(buffer);
+    }
+    async decompress(buffer) {
+        const { promisify } = require('util');
+        const { brotliDecompress } = require('zlib');
+        const decompress = promisify(brotliDecompress);
+        const decompressed = await decompress(buffer);
+        return JSON.parse(decompressed.toString());
+    }
+    evictL1() {
+        if (this.l1.size > 10000) {
+            const toDelete = this.l1.size - 8000;
+            const keys = Array.from(this.l1.keys()).slice(0, toDelete);
+            keys.forEach(k => this.l1.delete(k));
+        }
+    }
+}
+// 3. CONNECTION POOLING WITH HEALTH CHECKS
+class AdvancedConnectionPool {
+    constructor() {
+        this.pools = new Map();
+        this.healthScores = new Map();
+        this.maxPerPool = 100;
+        this.minPerPool = 10;
+        // Health check every 30 seconds
+        setInterval(() => this.healthCheck(), 30000);
+    }
+    async acquire(poolId) {
+        let pool = this.pools.get(poolId);
+        if (!pool) {
+            pool = [];
+            this.pools.set(poolId, pool);
+            this.healthScores.set(poolId, 1.0);
+        }
+        // Try to get healthy connection
+        let connection = null;
+        while (pool.length > 0 && !connection) {
+            const candidate = pool.pop();
+            if (await this.isHealthy(candidate)) {
+                connection = candidate;
+            }
+        }
+        // Create new if needed
+        if (!connection) {
+            connection = await this.createConnection(poolId);
+        }
+        return connection;
+    }
+    async release(poolId, connection) {
+        const pool = this.pools.get(poolId);
+        if (pool && pool.length < this.maxPerPool) {
+            pool.push(connection);
+        }
+        else {
+            await this.closeConnection(connection);
+        }
+    }
+    async isHealthy(connection) {
+        try {
+            await connection.ping();
+            return true;
+        }
+        catch {
+            return false;
+        }
+    }
+    async healthCheck() {
+        for (const [poolId, pool] of this.pools) {
+            let healthy = 0;
+            for (const conn of pool) {
+                if (await this.isHealthy(conn)) {
+                    healthy++;
+                }
+            }
+            const healthScore = pool.length > 0 ? healthy / pool.length : 1.0;
+            this.healthScores.set(poolId, healthScore);
+            // Maintain minimum pool size
+            while (pool.length < this.minPerPool) {
+                pool.push(await this.createConnection(poolId));
+            }
+        }
+    }
+    async createConnection(poolId) {
+        // Override in subclass
+        return { poolId, id: Math.random() };
+    }
+    async closeConnection(connection) {
+        // Override in subclass
+    }
+    getHealthScore(poolId) {
+        return this.healthScores.get(poolId) || 0;
+    }
+}
+// 4. RESULT STREAMING WITH BACKPRESSURE
+class StreamingResponder {
+    constructor() {
+        this.maxBufferSize = 1000;
+    }
+    async streamResults(query, processor, response) {
+        response.raw.setHeader('Content-Type', 'application/x-ndjson');
+        response.raw.setHeader('Cache-Control', 'no-cache');
+        response.raw.setHeader('X-Accel-Buffering', 'no'); // Disable nginx buffering
+        let bufferSize = 0;
+        let backpressure = false;
+        for await (const result of processor) {
+            // Check backpressure
+            if (!response.raw.write(JSON.stringify(result) + '\n')) {
+                backpressure = true;
+                await new Promise(resolve => response.raw.once('drain', resolve));
+                backpressure = false;
+            }
+            bufferSize++;
+            // Apply backpressure to source if buffer too large
+            if (bufferSize > this.maxBufferSize) {
+                await new Promise(resolve => setTimeout(resolve, 10));
+                bufferSize = Math.max(0, bufferSize - 100);
+            }
+        }
+        response.raw.end();
+    }
+}
+// 5. QUERY PLAN CACHE (for complex filters)
+class QueryPlanCache {
+    constructor() {
+        this.cache = new Map();
+        this.stats = new Map();
+    }
+    getPlan(filter) {
+        const key = this.getKey(filter);
+        const plan = this.cache.get(key);
+        if (plan) {
+            const stat = this.stats.get(key) || { hits: 0, avgTime: 0 };
+            stat.hits++;
+            this.stats.set(key, stat);
+        }
+        return plan;
+    }
+    cachePlan(filter, plan, executionTime) {
+        const key = this.getKey(filter);
+        this.cache.set(key, plan);
+        const stat = this.stats.get(key) || { hits: 0, avgTime: 0 };
+        stat.avgTime = (stat.avgTime * stat.hits + executionTime) / (stat.hits + 1);
+        this.stats.set(key, stat);
+        // Evict least valuable plans
+        if (this.cache.size > 1000) {
+            this.evictLowValue();
+        }
+    }
+    getKey(filter) {
+        return JSON.stringify(filter, Object.keys(filter).sort());
+    }
+    evictLowValue() {
+        // Calculate value score: hits / avgTime
+        const scored = Array.from(this.stats.entries())
+            .map(([key, stat]) => ({
+            key,
+            score: stat.hits / (stat.avgTime + 1)
+        }))
+            .sort((a, b) => a.score - b.score);
+        // Remove bottom 20%
+        const toRemove = Math.floor(scored.length * 0.2);
+        for (let i = 0; i < toRemove; i++) {
+            this.cache.delete(scored[i].key);
+            this.stats.delete(scored[i].key);
+        }
+    }
+}
+// 6. OPTIMIZED MAIN SERVICE
+// Shared Fastify server instance. It is configured here, has plugins and routes
+// attached below, and is exported as the module's default export.
+// NOTE(review): `http2: true` is set without any `https` options in this object —
+// confirm the deployment expects cleartext HTTP/2 and that the websocket plugin
+// registered below is compatible with it.
+const fastify = (0, fastify_1.default)({
+    logger: true,
+    trustProxy: true,
+    http2: true,
+    requestIdHeader: 'x-request-id',
+    requestIdLogLabel: 'reqId',
+    disableRequestLogging: true, // Custom logging for better performance
+    ignoreTrailingSlash: true,
+    maxParamLength: 500,
+    bodyLimit: 1048576, // 1MB
+    keepAliveTimeout: 65000, // Longer than ALB timeout
+    connectionTimeout: 70000,
+});
+// Register plugins
+// Security headers; the Content-Security-Policy header is switched off.
+fastify.register(helmet_1.default, {
+    contentSecurityPolicy: false,
+    global: true,
+});
+// Response compression for payloads of at least 1024 bytes, listing Brotli first.
+fastify.register(compress_1.default, {
+    global: true,
+    threshold: 1024,
+    encodings: ['br', 'gzip', 'deflate'],
+    brotliOptions: {
+        params: {
+            [require('zlib').constants.BROTLI_PARAM_MODE]: require('zlib').constants.BROTLI_MODE_TEXT,
+            [require('zlib').constants.BROTLI_PARAM_QUALITY]: 4, // Fast compression
+        }
+    },
+    zlibOptions: {
+        level: 6, // Balanced
+    }
+});
+// Redis-based rate limiting for distributed environment
+// A Redis client is only created when REDIS_URL is set; otherwise `redis` is
+// undefined and the plugin receives no Redis store.
+// NOTE(review): `createClient` is called on the `ioredis` export — confirm the
+// installed ioredis version provides it.
+fastify.register(rate_limit_1.default, {
+    global: true,
+    max: 1000,
+    timeWindow: '1 minute',
+    cache: 10000,
+    allowList: ['127.0.0.1'],
+    redis: process.env.REDIS_URL ? require('ioredis').createClient(process.env.REDIS_URL) : undefined,
+    nameSpace: 'ruvector:ratelimit:',
+    continueExceeding: true,
+    enableDraftSpec: true,
+});
+// WebSocket support: 1 MiB maximum payload, per-message deflate for messages of
+// at least 1024 bytes.
+fastify.register(websocket_1.default, {
+    options: {
+        maxPayload: 1048576,
+        clientTracking: true,
+        perMessageDeflate: {
+            zlibDeflateOptions: {
+                level: 6,
+            },
+            threshold: 1024,
+        }
+    }
+});
+// Initialize optimized components
+const vectorClient = new vector_client_1.VectorClient({
+    host: process.env.RUVECTOR_HOST || 'localhost',
+    port: parseInt(process.env.RUVECTOR_PORT || '50051'),
+    maxConnections: parseInt(process.env.MAX_CONNECTIONS || '100'),
+    minConnections: parseInt(process.env.MIN_CONNECTIONS || '10'),
+    enableCache: true,
+    cacheTTL: 3600,
+});
+const loadBalancer = new load_balancer_1.LoadBalancer({
+    backends: (process.env.BACKEND_URLS || '').split(','),
+    healthCheckInterval: 30000,
+    circuitBreakerThreshold: 5,
+    circuitBreakerTimeout: 60000,
+});
+const batcher = new AdaptiveBatcher();
+const queryPlanCache = new QueryPlanCache();
+const streamer = new StreamingResponder();
+// Setup adaptive batching
+class VectorBatcher extends AdaptiveBatcher {
+    async processBatch(queries) {
+        return vectorClient.batchQuery(queries);
+    }
+}
+const vectorBatcher = new VectorBatcher();
+// Optimized batch query endpoint with plan caching
+fastify.post('/api/query/batch', async (request, reply) => {
+    const { queries, priority = 'normal' } = request.body;
+    const results = await Promise.all(queries.map((query) => vectorBatcher.add(query, priority)));
+    return { results, count: results.length };
+});
+// Streaming query with backpressure
+fastify.get('/api/query/stream', async (request, reply) => {
+    const { vector, topK = 10, filters } = request.query;
+    // Check query plan cache
+    let plan = filters ? queryPlanCache.getPlan(filters) : null;
+    async function* resultGenerator() {
+        const startTime = Date.now();
+        for await (const result of vectorClient.streamQuery({ vector, topK, filters, plan })) {
+            yield result;
+        }
+        // Cache the plan if it was efficient
+        if (filters && !plan) {
+            const executionTime = Date.now() - startTime;
+            queryPlanCache.cachePlan(filters, { ...filters, optimized: true }, executionTime);
+        }
+    }
+    await streamer.streamResults({ vector, topK, filters }, resultGenerator(), reply);
+});
+// Health endpoint with detailed status
+fastify.get('/health', async (request, reply) => {
+    const health = {
+        status: 'healthy',
+        timestamp: new Date().toISOString(),
+        uptime: process.uptime(),
+        memory: process.memoryUsage(),
+        connections: {
+            active: vectorClient.getActiveConnections(),
+            poolSize: vectorClient.getPoolSize(),
+        },
+        cache: {
+            hitRate: vectorClient.getCacheHitRate(),
+            size: vectorClient.getCacheSize(),
+        },
+        batcher: {
+            queueSizes: {},
+        },
+        loadBalancer: {
+            backends: loadBalancer.getBackendHealth(),
+        },
+    };
+    return health;
+});
+// Graceful shutdown
+const gracefulShutdown = async (signal) => {
+    console.log(`Received ${signal}, starting graceful shutdown...`);
+    // Stop accepting new connections
+    await fastify.close();
+    // Wait for in-flight requests (max 30 seconds)
+    await new Promise(resolve => setTimeout(resolve, 30000));
+    // Close connections
+    await vectorClient.close();
+    console.log('Graceful shutdown complete');
+    process.exit(0);
+};
+process.on('SIGTERM', () => gracefulShutdown('SIGTERM'));
+process.on('SIGINT', () => gracefulShutdown('SIGINT'));
+// Start server
+const start = async () => {
+    try {
+        const port = parseInt(process.env.PORT || '8080');
+        const host = process.env.HOST || '0.0.0.0';
+        await fastify.listen({ port, host });
+        console.log(`Server listening on ${host}:${port}`);
+        console.log(`Optimizations enabled: adaptive batching, compressed cache, connection pooling`);
+    }
+    catch (err) {
+        fastify.log.error(err);
+        process.exit(1);
+    }
+};
+start();
+exports.default = fastify;
+//# sourceMappingURL=streaming-service-optimized.js.map