initial

2026-01-30 03:16:57 +00:00
commit daaf6559e3
80 changed files with 14430 additions and 0 deletions
--- a/ts/models/index.ts
+++ b/ts/models/index.ts
@@ -0,0 +1,8 @@
+/**
+ * Model Management Module
+ *
+ * Exports model registry and loader functionality.
+ */
+
+export { ModelRegistry } from './registry.ts';
+export { ModelLoader } from './loader.ts';
--- a/ts/models/loader.ts
+++ b/ts/models/loader.ts
@@ -0,0 +1,291 @@
+/**
+ * Model Loader
+ *
+ * Handles automatic model loading with greenlist validation.
+ */
+
+import type { TContainerType } from '../interfaces/container.ts';
+import { logger } from '../logger.ts';
+import { ModelRegistry } from './registry.ts';
+import { ContainerManager } from '../containers/container-manager.ts';
+import { GpuDetector } from '../hardware/gpu-detector.ts';
+
+/**
+ * Model load result
+ */
+export interface IModelLoadResult {
+  success: boolean;
+  model: string;
+  container?: string;
+  error?: string;
+  alreadyLoaded?: boolean;
+}
+
+/**
+ * Model loader with greenlist validation
+ */
+export class ModelLoader {
+  private registry: ModelRegistry;
+  private containerManager: ContainerManager;
+  private gpuDetector: GpuDetector;
+  private autoPull: boolean;
+
+  constructor(
+    registry: ModelRegistry,
+    containerManager: ContainerManager,
+    autoPull: boolean = true,
+  ) {
+    this.registry = registry;
+    this.containerManager = containerManager;
+    this.gpuDetector = new GpuDetector();
+    this.autoPull = autoPull;
+  }
+
+  /**
+   * Load a model with greenlist validation
+   */
+  public async loadModel(modelName: string): Promise<IModelLoadResult> {
+    logger.info(`Loading model: ${modelName}`);
+
+    // Step 1: Check if model is already loaded in any container
+    const container = await this.containerManager.findContainerForModel(modelName);
+    if (container) {
+      logger.dim(`Model ${modelName} is already available in container ${container.getConfig().id}`);
+      return {
+        success: true,
+        model: modelName,
+        container: container.getConfig().id,
+        alreadyLoaded: true,
+      };
+    }
+
+    // Step 2: Check if model is greenlit
+    const isGreenlit = await this.registry.isModelGreenlit(modelName);
+    if (!isGreenlit) {
+      logger.error(`Model ${modelName} is not in the greenlit list`);
+      logger.info('Only greenlit models can be auto-pulled for security reasons.');
+      logger.info('Contact your administrator to add this model to the greenlist.');
+      return {
+        success: false,
+        model: modelName,
+        error: `Model "${modelName}" is not greenlit. Request via admin or add to greenlist.`,
+      };
+    }
+
+    // Step 3: Get model info from greenlist
+    const modelInfo = await this.registry.getGreenlitModel(modelName);
+    if (!modelInfo) {
+      return {
+        success: false,
+        model: modelName,
+        error: 'Failed to get model info from greenlist',
+      };
+    }
+
+    // Step 4: Check VRAM requirements
+    const gpus = await this.gpuDetector.detectGpus();
+    const totalVram = gpus.reduce((sum, gpu) => sum + gpu.vram, 0);
+    const totalVramGb = Math.round(totalVram / 1024);
+
+    if (modelInfo.minVram > totalVramGb) {
+      logger.error(`Insufficient VRAM for model ${modelName}`);
+      logger.info(`Required: ${modelInfo.minVram}GB, Available: ${totalVramGb}GB`);
+      return {
+        success: false,
+        model: modelName,
+        error: `Insufficient VRAM. Required: ${modelInfo.minVram}GB, Available: ${totalVramGb}GB`,
+      };
+    }
+
+    // Step 5: Find or create appropriate container
+    const containerType = modelInfo.container;
+    let targetContainer = await this.findAvailableContainer(containerType);
+
+    if (!targetContainer) {
+      logger.warn(`No ${containerType} container available`);
+
+      // Could auto-create container here if desired
+      return {
+        success: false,
+        model: modelName,
+        error: `No ${containerType} container available to load model`,
+      };
+    }
+
+    // Step 6: Pull the model if auto-pull is enabled
+    if (this.autoPull) {
+      logger.info(`Pulling model ${modelName} to ${containerType} container...`);
+
+      const pullSuccess = await targetContainer.pullModel(modelName, (progress) => {
+        const percent = progress.percent !== undefined ? ` (${progress.percent}%)` : '';
+        logger.dim(`  ${progress.status}${percent}`);
+      });
+
+      if (!pullSuccess) {
+        return {
+          success: false,
+          model: modelName,
+          error: 'Failed to pull model',
+        };
+      }
+    }
+
+    logger.success(`Model ${modelName} loaded successfully`);
+    return {
+      success: true,
+      model: modelName,
+      container: targetContainer.getConfig().id,
+    };
+  }
+
+  /**
+   * Find an available container of the specified type
+   */
+  private async findAvailableContainer(
+    containerType: TContainerType,
+  ): Promise<import('../containers/base-container.ts').BaseContainer | null> {
+    const containers = this.containerManager.getAllContainers();
+
+    for (const container of containers) {
+      if (container.type !== containerType) {
+        continue;
+      }
+
+      const status = await container.getStatus();
+      if (status.running) {
+        return container;
+      }
+    }
+
+    // No running container found, try to start one
+    for (const container of containers) {
+      if (container.type !== containerType) {
+        continue;
+      }
+
+      logger.info(`Starting ${containerType} container: ${container.getConfig().name}`);
+      const started = await container.start();
+      if (started) {
+        return container;
+      }
+    }
+
+    return null;
+  }
+
+  /**
+   * Preload a list of models
+   */
+  public async preloadModels(modelNames: string[]): Promise<Map<string, IModelLoadResult>> {
+    const results = new Map<string, IModelLoadResult>();
+
+    for (const modelName of modelNames) {
+      const result = await this.loadModel(modelName);
+      results.set(modelName, result);
+
+      if (!result.success) {
+        logger.warn(`Failed to preload model: ${modelName}`);
+      }
+    }
+
+    return results;
+  }
+
+  /**
+   * Unload a model from a container
+   */
+  public async unloadModel(modelName: string): Promise<boolean> {
+    const container = await this.containerManager.findContainerForModel(modelName);
+    if (!container) {
+      logger.warn(`Model ${modelName} not found in any container`);
+      return false;
+    }
+
+    return container.removeModel(modelName);
+  }
+
+  /**
+   * Check if auto-pull is enabled
+   */
+  public isAutoPullEnabled(): boolean {
+    return this.autoPull;
+  }
+
+  /**
+   * Enable or disable auto-pull
+   */
+  public setAutoPull(enabled: boolean): void {
+    this.autoPull = enabled;
+  }
+
+  /**
+   * Get loading recommendations for available VRAM
+   */
+  public async getRecommendations(): Promise<{
+    canLoad: string[];
+    cannotLoad: string[];
+    loaded: string[];
+  }> {
+    const gpus = await this.gpuDetector.detectGpus();
+    const totalVramGb = Math.round(gpus.reduce((sum, gpu) => sum + gpu.vram, 0) / 1024);
+
+    const allModels = await this.registry.getAllGreenlitModels();
+    const availableModels = await this.containerManager.getAllAvailableModels();
+    const loadedNames = new Set(availableModels.keys());
+
+    const canLoad: string[] = [];
+    const cannotLoad: string[] = [];
+    const loaded: string[] = [];
+
+    for (const model of allModels) {
+      if (loadedNames.has(model.name)) {
+        loaded.push(model.name);
+      } else if (model.minVram <= totalVramGb) {
+        canLoad.push(model.name);
+      } else {
+        cannotLoad.push(model.name);
+      }
+    }
+
+    return { canLoad, cannotLoad, loaded };
+  }
+
+  /**
+   * Print loading status
+   */
+  public async printStatus(): Promise<void> {
+    const recommendations = await this.getRecommendations();
+
+    logger.logBoxTitle('Model Loading Status', 60, 'info');
+
+    logger.logBoxLine(`Loaded Models (${recommendations.loaded.length}):`);
+    if (recommendations.loaded.length > 0) {
+      for (const model of recommendations.loaded) {
+        logger.logBoxLine(`  - ${model}`);
+      }
+    } else {
+      logger.logBoxLine('  None');
+    }
+
+    logger.logBoxLine('');
+    logger.logBoxLine(`Available to Load (${recommendations.canLoad.length}):`);
+    for (const model of recommendations.canLoad.slice(0, 5)) {
+      logger.logBoxLine(`  - ${model}`);
+    }
+    if (recommendations.canLoad.length > 5) {
+      logger.logBoxLine(`  ... and ${recommendations.canLoad.length - 5} more`);
+    }
+
+    logger.logBoxLine('');
+    logger.logBoxLine(`Insufficient VRAM (${recommendations.cannotLoad.length}):`);
+    for (const model of recommendations.cannotLoad.slice(0, 3)) {
+      const info = await this.registry.getGreenlitModel(model);
+      logger.logBoxLine(`  - ${model} (needs ${info?.minVram || '?'}GB)`);
+    }
+    if (recommendations.cannotLoad.length > 3) {
+      logger.logBoxLine(`  ... and ${recommendations.cannotLoad.length - 3} more`);
+    }
+
+    logger.logBoxEnd();
+  }
+}
--- a/ts/models/registry.ts
+++ b/ts/models/registry.ts
@@ -0,0 +1,252 @@
+/**
+ * Model Registry
+ *
+ * Manages the greenlit model list and model availability.
+ */
+
+import type { IGreenlitModel, IGreenlitModelsList } from '../interfaces/config.ts';
+import type { TContainerType } from '../interfaces/container.ts';
+import { MODEL_REGISTRY, TIMING } from '../constants.ts';
+import { logger } from '../logger.ts';
+
+/**
+ * Model registry for managing greenlit models
+ */
+export class ModelRegistry {
+  private greenlistUrl: string;
+  private cachedGreenlist: IGreenlitModelsList | null = null;
+  private cacheTime: number = 0;
+
+  constructor(greenlistUrl: string = MODEL_REGISTRY.DEFAULT_GREENLIST_URL) {
+    this.greenlistUrl = greenlistUrl;
+  }
+
+  /**
+   * Set the greenlist URL
+   */
+  public setGreenlistUrl(url: string): void {
+    this.greenlistUrl = url;
+    this.cachedGreenlist = null;
+    this.cacheTime = 0;
+  }
+
+  /**
+   * Fetch the greenlit model list from remote URL
+   */
+  public async fetchGreenlist(forceRefresh: boolean = false): Promise<IGreenlitModelsList> {
+    // Return cached data if still valid
+    if (
+      !forceRefresh &&
+      this.cachedGreenlist &&
+      Date.now() - this.cacheTime < TIMING.GREENLIST_CACHE_DURATION_MS
+    ) {
+      return this.cachedGreenlist;
+    }
+
+    try {
+      logger.dim(`Fetching greenlit models from: ${this.greenlistUrl}`);
+
+      const controller = new AbortController();
+      const timeout = setTimeout(() => controller.abort(), 30000);
+
+      const response = await fetch(this.greenlistUrl, {
+        signal: controller.signal,
+        headers: {
+          'Accept': 'application/json',
+          'User-Agent': 'ModelGrid/1.0',
+        },
+      });
+
+      clearTimeout(timeout);
+
+      if (!response.ok) {
+        throw new Error(`HTTP ${response.status}: ${response.statusText}`);
+      }
+
+      const greenlist = await response.json() as IGreenlitModelsList;
+
+      // Validate structure
+      if (!greenlist.models || !Array.isArray(greenlist.models)) {
+        throw new Error('Invalid greenlist format: missing models array');
+      }
+
+      // Cache the result
+      this.cachedGreenlist = greenlist;
+      this.cacheTime = Date.now();
+
+      logger.dim(`Loaded ${greenlist.models.length} greenlit models`);
+      return greenlist;
+    } catch (error) {
+      logger.warn(`Failed to fetch greenlist: ${error instanceof Error ? error.message : String(error)}`);
+
+      // Return fallback if we have no cache
+      if (!this.cachedGreenlist) {
+        logger.dim('Using fallback greenlist');
+        return this.getFallbackGreenlist();
+      }
+
+      // Return stale cache
+      return this.cachedGreenlist;
+    }
+  }
+
+  /**
+   * Get fallback greenlist
+   */
+  private getFallbackGreenlist(): IGreenlitModelsList {
+    return {
+      version: '1.0',
+      lastUpdated: new Date().toISOString(),
+      models: MODEL_REGISTRY.FALLBACK_GREENLIST as unknown as IGreenlitModel[],
+    };
+  }
+
+  /**
+   * Check if a model is greenlit
+   */
+  public async isModelGreenlit(modelName: string): Promise<boolean> {
+    const greenlist = await this.fetchGreenlist();
+    return greenlist.models.some((m) => this.normalizeModelName(m.name) === this.normalizeModelName(modelName));
+  }
+
+  /**
+   * Get greenlit model info
+   */
+  public async getGreenlitModel(modelName: string): Promise<IGreenlitModel | null> {
+    const greenlist = await this.fetchGreenlist();
+    const normalized = this.normalizeModelName(modelName);
+    return greenlist.models.find((m) => this.normalizeModelName(m.name) === normalized) || null;
+  }
+
+  /**
+   * Get all greenlit models
+   */
+  public async getAllGreenlitModels(): Promise<IGreenlitModel[]> {
+    const greenlist = await this.fetchGreenlist();
+    return greenlist.models;
+  }
+
+  /**
+   * Get greenlit models by container type
+   */
+  public async getModelsByContainer(containerType: TContainerType): Promise<IGreenlitModel[]> {
+    const greenlist = await this.fetchGreenlist();
+    return greenlist.models.filter((m) => m.container === containerType);
+  }
+
+  /**
+   * Get greenlit models that fit within VRAM limit
+   */
+  public async getModelsWithinVram(maxVramGb: number): Promise<IGreenlitModel[]> {
+    const greenlist = await this.fetchGreenlist();
+    return greenlist.models.filter((m) => m.minVram <= maxVramGb);
+  }
+
+  /**
+   * Get recommended container type for a model
+   */
+  public async getRecommendedContainer(modelName: string): Promise<TContainerType | null> {
+    const model = await this.getGreenlitModel(modelName);
+    return model ? model.container : null;
+  }
+
+  /**
+   * Get minimum VRAM required for a model
+   */
+  public async getMinVram(modelName: string): Promise<number | null> {
+    const model = await this.getGreenlitModel(modelName);
+    return model ? model.minVram : null;
+  }
+
+  /**
+   * Check if model fits in available VRAM
+   */
+  public async modelFitsInVram(modelName: string, availableVramGb: number): Promise<boolean> {
+    const minVram = await this.getMinVram(modelName);
+    if (minVram === null) {
+      // Model not in greenlist, assume it might fit
+      return true;
+    }
+    return availableVramGb >= minVram;
+  }
+
+  /**
+   * Normalize model name for comparison
+   * Handles variations like "llama3:8b" vs "llama3:8B" vs "meta-llama/llama-3-8b"
+   */
+  private normalizeModelName(name: string): string {
+    return name
+      .toLowerCase()
+      .replace(/[^a-z0-9:.-]/g, '')
+      .trim();
+  }
+
+  /**
+   * Search models by name pattern
+   */
+  public async searchModels(pattern: string): Promise<IGreenlitModel[]> {
+    const greenlist = await this.fetchGreenlist();
+    const normalizedPattern = pattern.toLowerCase();
+
+    return greenlist.models.filter((m) =>
+      m.name.toLowerCase().includes(normalizedPattern) ||
+      m.description?.toLowerCase().includes(normalizedPattern) ||
+      m.tags?.some((t) => t.toLowerCase().includes(normalizedPattern))
+    );
+  }
+
+  /**
+   * Get models by tags
+   */
+  public async getModelsByTags(tags: string[]): Promise<IGreenlitModel[]> {
+    const greenlist = await this.fetchGreenlist();
+    const normalizedTags = tags.map((t) => t.toLowerCase());
+
+    return greenlist.models.filter((m) =>
+      m.tags?.some((t) => normalizedTags.includes(t.toLowerCase()))
+    );
+  }
+
+  /**
+   * Clear the cached greenlist
+   */
+  public clearCache(): void {
+    this.cachedGreenlist = null;
+    this.cacheTime = 0;
+  }
+
+  /**
+   * Print greenlist summary
+   */
+  public async printSummary(): Promise<void> {
+    const greenlist = await this.fetchGreenlist();
+
+    // Group by container type
+    const byContainer = new Map<string, IGreenlitModel[]>();
+    for (const model of greenlist.models) {
+      if (!byContainer.has(model.container)) {
+        byContainer.set(model.container, []);
+      }
+      byContainer.get(model.container)!.push(model);
+    }
+
+    logger.logBoxTitle('Greenlit Models', 60, 'info');
+    logger.logBoxLine(`Version: ${greenlist.version}`);
+    logger.logBoxLine(`Last Updated: ${greenlist.lastUpdated}`);
+    logger.logBoxLine(`Total Models: ${greenlist.models.length}`);
+    logger.logBoxLine('');
+
+    for (const [container, models] of byContainer) {
+      logger.logBoxLine(`${container.toUpperCase()} (${models.length}):`);
+      for (const model of models.slice(0, 5)) {
+        logger.logBoxLine(`  - ${model.name} (${model.minVram}GB VRAM)`);
+      }
+      if (models.length > 5) {
+        logger.logBoxLine(`  ... and ${models.length - 5} more`);
+      }
+      logger.logBoxLine('');
+    }
+
+    logger.logBoxEnd();
+  }
+}