
Commit 98673c2

fix: add model types
1 parent c9b562e commit 98673c2

11 files changed: +209 additions, -429 deletions

src/AudioModule.ts

Lines changed: 4 additions & 23 deletions

@@ -31,13 +31,10 @@ export class AudioModule extends BaseModule {
 
     const { ttsModels = [], lazyLoad = false } = options;
 
-    // Check hardware capabilities
-    const capabilities = await this.webgpuChecker.check();
-
     this.progressTracker.update({
       status: 'init',
       type: 'audio_module',
-      message: `Hardware check: WebGPU ${capabilities.isWebGPUSupported ? 'available' : 'not available'}`
+      // message: `Hardware check: WebGPU ${capabilities.isWebGPUSupported ? 'available' : 'not available'}` FIX ME:
     });
 
     // Load first model if specified and not using lazy loading
@@ -92,26 +89,13 @@ export class AudioModule extends BaseModule {
     this.activeModel = model;
 
     try {
-      // Check hardware capabilities
-      const capabilities = await this.webgpuChecker.check();
-
-      // Get optimal config
-      const config = await this.getOptimalDeviceConfig();
-
-      // For TTS models, always use CPU in Node.js environment or proper fallback
-      const isNode = this.isNodeEnvironment();
-
-      // Determine device explicitly
-      const device = isNode ? "cpu" :
-        !capabilities.isWebGPUSupported ? "wasm" : "webgpu";
-
       // Initial progress message
       this.progressTracker.update({
         status: 'loading',
         type: 'tts_model',
         progress: 0,
         percentComplete: 0,
-        message: `Loading TTS model ${model} (device="${device}", dtype="${config.dtype}")`
+        // message: `Loading TTS model ${model} (device="${device}", dtype="${config.dtype}")` FIX ME:
       });
 
       // Load the model directly by name
@@ -126,8 +110,8 @@ export class AudioModule extends BaseModule {
           ...progress
         });
       },
-      device: device,
-      dtype: config.dtype
+      device: 'webgpu', // device, FIX ME:
+      dtype: 'fp16', // config.dtype FIX ME:
     });
 
     // Register the model as loaded
@@ -281,9 +265,6 @@ export class AudioModule extends BaseModule {
       this.activeModel = null;
     }
 
-    // Try to trigger garbage collection
-    this.triggerGC();
-
     this.progressTracker.update({
       status: 'offloaded',
       type: 'tts_model',
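
The hardcoded device: 'webgpu' and dtype: 'fp16' above are stopgaps flagged FIX ME. A minimal sketch of how they could instead be derived from the new catalog in src/Models.ts; the resolveLoadOptions helper and the 'webgpu' default are assumptions, not part of this commit:

import { modelCatalog, DeviceConfig, Model } from './Models';

// Hypothetical helper (not in this commit): prefer the catalog's quantization
// for known models, otherwise fall back to the values currently hardcoded.
function resolveLoadOptions(model: string): DeviceConfig {
  const entry: Model | undefined = (modelCatalog as Record<string, Model>)[model];
  return {
    // Assumed default until the hardware check is restored.
    device: 'webgpu' as DeviceConfig['device'],
    // Catalog quantization when the model is known, else the current stopgap.
    dtype: entry?.quantization ?? 'fp16',
  };
}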

src/BaseModule.ts

Lines changed: 1 addition & 44 deletions

@@ -3,10 +3,8 @@
  * Provides common structure for all modules like generation, embeddings, etc.
  */
 
-import { WebGPUChecker } from './WebGPUChecker';
 import { ProgressTracker } from './ProgressTracker';
-import { tryGarbageCollection, EnvironmentInfo } from './utils';
-import { DeviceConfig } from './types';
+import { DeviceConfig } from './Models';
 
 /**
  * Base interface for TinyLM modules
@@ -26,8 +24,6 @@ export interface TinyLMModule {
 export abstract class BaseModule implements TinyLMModule {
   protected tinyLM: any;
   protected progressTracker: ProgressTracker;
-  protected webgpuChecker: WebGPUChecker;
-  protected environment: EnvironmentInfo;
 
   /**
    * Create a new module
@@ -36,8 +32,6 @@ export abstract class BaseModule implements TinyLMModule {
   constructor(tinyLM: any) {
     this.tinyLM = tinyLM;
     this.progressTracker = tinyLM.getProgressTracker();
-    this.webgpuChecker = tinyLM.getWebGPUChecker();
-    this.environment = tinyLM.getEnvironment();
   }
 
   /**
@@ -48,41 +42,4 @@ export abstract class BaseModule implements TinyLMModule {
   async init(options: Record<string, any> = {}): Promise<void> {
     // Base initialization code
   }
-
-  /**
-   * Get optimal device configuration based on capabilities
-   * @returns {Promise<DeviceConfig>} Device configuration
-   */
-  protected async getOptimalDeviceConfig(): Promise<DeviceConfig> {
-    const capabilities = await this.webgpuChecker.check();
-    return this.webgpuChecker.getOptimalConfig();
-  }
-
-  /**
-   * Trigger garbage collection if available
-   */
-  protected triggerGC(): void {
-    try {
-      // Use the utility function
-      tryGarbageCollection();
-    } catch (error) {
-      // Ignore errors
-    }
-  }
-
-  /**
-   * Check if running in a Node.js environment
-   * @returns {boolean} True if in Node.js environment
-   */
-  protected isNodeEnvironment(): boolean {
-    return this.environment.isNode;
-  }
-
-  /**
-   * Check if running in a browser environment
-   * @returns {boolean} True if in browser environment
-   */
-  protected isBrowserEnvironment(): boolean {
-    return this.environment.isBrowser;
-  }
 }
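
With the WebGPU checker and environment helpers gone from BaseModule, a subclass that still needs them can fetch them from the injected TinyLM instance, as the removed constructor lines did. A sketch under that assumption (getWebGPUChecker and getEnvironment are the accessors the old constructor called; their continued existence on TinyLM is assumed, not confirmed by this commit):

import { BaseModule } from './BaseModule';

class HardwareAwareModule extends BaseModule {
  // Sketch only: pull the checker on demand instead of caching it in the base class.
  protected async canUseWebGPU(): Promise<boolean> {
    const capabilities = await this.tinyLM.getWebGPUChecker().check();
    return capabilities.isWebGPUSupported;
  }

  // Sketch only: stand-in for the removed isNodeEnvironment() helper.
  protected isNode(): boolean {
    return this.tinyLM.getEnvironment().isNode;
  }
}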

src/EmbeddingsModule.ts

Lines changed: 11 additions & 17 deletions

@@ -152,25 +152,22 @@ export class EmbeddingsModule extends BaseModule {
     });
 
     try {
-      // Check WebGPU capabilities and get optimal config
-      const capabilities = await this.webgpuChecker.check();
-      const config = await this.getOptimalDeviceConfig();
-
       let modelInfo: EmbeddingModelInfo;
 
       // Strategy based on WebGPU availability
-      if (capabilities.isWebGPUSupported) {
+      // if (capabilities.isWebGPUSupported) { FIX ME:
+      if (true) {
         // WebGPU is available - try direct tokenizer+model approach first
         try {
-          modelInfo = await this._loadWithTokenizerAndModel(model, config);
+          modelInfo = await this._loadWithTokenizerAndModel(model);
         } catch (directError) {
           // Direct approach failed, fall back to pipeline
           console.warn('Direct model loading failed, falling back to pipeline:', directError);
-          modelInfo = await this._loadWithPipeline(model, config);
+          modelInfo = await this._loadWithPipeline(model);
         }
       } else {
         // WebGPU not available - use pipeline approach for simplicity
-        modelInfo = await this._loadWithPipeline(model, config);
+        modelInfo = await this._loadWithPipeline(model);
       }
 
       // Validate dimensions if specified
@@ -207,7 +204,8 @@ export class EmbeddingsModule extends BaseModule {
    * @param {any} config - Device configuration
    * @returns {Promise<EmbeddingModelInfo>} Model information
    */
-  private async _loadWithTokenizerAndModel(model: string, config: any): Promise<EmbeddingModelInfo> {
+  // private async _loadWithTokenizerAndModel(model: string, config: DeviceConfig): Promise<EmbeddingModelInfo> { FIX ME:
+  private async _loadWithTokenizerAndModel(model: string): Promise<EmbeddingModelInfo> {
     // Progress callback for loading
     const progressCallback = (component: string) => (progress: any) => {
       this.progressTracker.update({
@@ -228,8 +226,6 @@ export class EmbeddingsModule extends BaseModule {
 
     // Load model with optimal configuration
     const embeddingModel = await AutoModel.from_pretrained(model, {
-      ...(config.device ? { device: config.device } : {}),
-      ...(config.dtype ? { dtype: config.dtype } : {}),
      progress_callback: progressCallback('model')
     });
 
@@ -250,11 +246,12 @@ export class EmbeddingsModule extends BaseModule {
    * @param {any} config - Device configuration
    * @returns {Promise<EmbeddingModelInfo>} Model information
    */
-  private async _loadWithPipeline(model: string, config: any): Promise<EmbeddingModelInfo> {
+  // private async _loadWithPipeline(model: string, config: any): Promise<EmbeddingModelInfo> {
+  private async _loadWithPipeline(model: string): Promise<EmbeddingModelInfo> {
     // Load using feature-extraction pipeline
     const embeddingPipeline = await pipeline('feature-extraction', model, {
-      ...(config.device ? { device: config.device } : {}),
-      ...(config.dtype ? { dtype: config.dtype } : {}),
+      // ...(config.device ? { device: config.device } : {}),
+      // ...(config.dtype ? { dtype: config.dtype } : {}),
       progress_callback: (progress: any) => {
         this.progressTracker.update({
           status: 'loading',
@@ -459,9 +456,6 @@ export class EmbeddingsModule extends BaseModule {
     // Remove from registry
     this.embeddingModels.delete(model);
 
-    // Try to trigger garbage collection
-    this.triggerGC();
-
     this.progressTracker.update({
       status: 'offloaded',
       type: 'embedding_model',
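
The if (true) placeholder above always takes the WebGPU path. A browser-only sketch of restoring the branch without the removed WebGPUChecker, using the standard navigator.gpu feature test; whether that detection is sufficient here is an assumption:

// Sketch: feature-test WebGPU directly instead of the removed webgpuChecker.
// navigator.gpu is the standard WebGPU entry point; it is undefined in Node.js
// and in browsers without WebGPU.
const isWebGPUSupported: boolean =
  typeof navigator !== 'undefined' && 'gpu' in navigator;

if (isWebGPUSupported) {
  // ...try the direct tokenizer+model approach first
} else {
  // ...use the pipeline approach for simplicity
}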

src/GenerationModule.ts

Lines changed: 5 additions & 11 deletions

@@ -57,13 +57,10 @@ export class GenerationModule extends BaseModule {
 
     const { models = [], lazyLoad = false } = options;
 
-    // Check hardware capabilities
-    const capabilities = await this.webgpuChecker.check();
-
     this.progressTracker.update({
       status: 'init',
       type: 'generation_module',
-      message: `Hardware check: WebGPU ${capabilities.isWebGPUSupported ? 'available' : 'not available'}`
+      // message: `Hardware check: WebGPU ${capabilities.isWebGPUSupported ? 'available' : 'not available'}` FIX ME:
     });
 
     // Load first model if specified and not using lazy loading
@@ -122,14 +119,14 @@ export class GenerationModule extends BaseModule {
 
     try {
       // Check hardware capabilities
-      const capabilities = await this.webgpuChecker.check();
+      // const capabilities = await this.webgpuChecker.check();
 
       // Get optimal config (or use user-provided quantization)
-      const config = await this.getOptimalDeviceConfig();
+      // const config = await this.getOptimalDeviceConfig();
       const modelConfig: Record<string, any> = {
         // Only specify device and dtype if we have definitive information
-        ...(config.device ? { device: config.device } : {}),
-        ...(config.dtype || quantization ? { dtype: quantization || config.dtype } : {})
+        // ...(config.device ? { device: config.device } : {}),
+        // ...(config.dtype || quantization ? { dtype: quantization || config.dtype } : {}) FIX ME:
       };
 
       // Initialize file progress tracker for this model load
@@ -326,9 +323,6 @@ export class GenerationModule extends BaseModule {
       this.activeModel = null;
     }
 
-    // Try to trigger garbage collection
-    this.triggerGC();
-
    this.progressTracker.update({
      status: 'offloaded',
      type: 'model',
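
With both spreads commented out, modelConfig is now always empty, so a caller-supplied quantization is silently ignored. A minimal sketch of keeping the user override alive while the FIX ME stands; the buildModelConfig helper is illustrative, not part of the commit:

import { DType } from './Models';

// Hypothetical helper: honor a user-supplied quantization even while
// getOptimalDeviceConfig() is disabled; device is intentionally left unset.
function buildModelConfig(quantization?: DType): Record<string, any> {
  return {
    ...(quantization ? { dtype: quantization } : {}),
  };
}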

src/Models.ts

Lines changed: 131 additions & 0 deletions

@@ -0,0 +1,131 @@
+import { DeviceType } from "./Runtime";
+
+// Precision data types distributed as a union
+export type _FullPrecisionDType = 'fp32';
+export type _HalfPrecisionDType = 'fp16';
+export type _8BitPrecisionDType = 'q8' | 'int8' | 'uint8';
+export type _4BitPrecisionDType = 'q4' | 'bnb4' | 'q4f16';
+
+// Combine into a full union
+export type DType = _FullPrecisionDType | _HalfPrecisionDType | _8BitPrecisionDType | _4BitPrecisionDType;
+
+/**
+ * Device configuration
+ */
+export interface DeviceConfig {
+  device?: DeviceType;
+  dtype?: DType;
+}
+
+/**
+ * Task type for the models
+ */
+type TaskType =
+  'text-generation'
+  | 'embedding-generation'
+  | 'text-to-speech'
+  | 'speech-to-text'
+
+/**
+ * Interface for the model
+ */
+export interface Model {
+  repository: string,
+  quantization: DType,
+  taskType: TaskType,
+  [key: string]: string,
+}
+
+/**
+ * Unions of supported model identifiers
+ */
+type LanguageModelsType =
+  'onnx-community/DeepSeek-R1-Distill-Qwen-1.5B-ONNX'
+  | 'onnx-community/Llama-3.2-1B-Instruct-q4f16'
+  | 'HuggingFaceTB/SmolLM2-1.7B-Instruct'
+
+type VisionLanguageModelsType =
+  'HuggingFaceTB/SmolVLM-256M-Instruct'
+
+type TextEmbeddingModelsType =
+  'nomic-ai/nomic-embed-text-v1.5'
+
+type MultiModalEmbeddingModelsType =
+  'jinaai/jina-clip-v1'
+
+type TextToSpeechModelsType =
+  'onnx-community/Kokoro-82M-v1.0-ONNX'
+
+type SpeechToTextModelsType =
+  'onnx-community/moonshine-base-ONNX'
+  | 'onnx-community/whisper-tiny.en'
+
+/**
+ * Models natively supported by TinyLM
+ */
+type SupportedModelsType = LanguageModelsType | VisionLanguageModelsType | TextEmbeddingModelsType | MultiModalEmbeddingModelsType | TextToSpeechModelsType | SpeechToTextModelsType
+
+type ModelCatalogType = Record<SupportedModelsType, Model>
+
+/**
+ * Model Catalog - Maps all supported models to their configurations
+ */
+export const modelCatalog: ModelCatalogType = {
+  // Language Models
+  "onnx-community/DeepSeek-R1-Distill-Qwen-1.5B-ONNX": {
+    repository: "onnx-community/DeepSeek-R1-Distill-Qwen-1.5B-ONNX",
+    quantization: "fp16",
+    taskType: "text-generation",
+  },
+  "onnx-community/Llama-3.2-1B-Instruct-q4f16": {
+    repository: "onnx-community/Llama-3.2-1B-Instruct-q4f16",
+    quantization: "q4f16",
+    taskType: "text-generation",
+  },
+  "HuggingFaceTB/SmolLM2-1.7B-Instruct": {
+    repository: "HuggingFaceTB/SmolLM2-1.7B-Instruct",
+    quantization: "q8",
+    taskType: "text-generation",
+  },
+
+  // Vision Language Models
+  "HuggingFaceTB/SmolVLM-256M-Instruct": {
+    repository: "HuggingFaceTB/SmolVLM-256M-Instruct",
+    quantization: "fp16",
+    taskType: "text-generation",
+  },
+
+  // Text Embedding Models
+  "nomic-ai/nomic-embed-text-v1.5": {
+    repository: "nomic-ai/nomic-embed-text-v1.5",
+    quantization: "fp32",
+    taskType: "embedding-generation",
+  },
+
+  // Multi-Modal Embedding Models
+  "jinaai/jina-clip-v1": {
+    repository: "jinaai/jina-clip-v1",
+    quantization: "fp16",
+    taskType: "embedding-generation",
+  },
+
+  // Text-to-Speech Models
+  "onnx-community/Kokoro-82M-v1.0-ONNX": {
+    repository: "onnx-community/Kokoro-82M-v1.0-ONNX",
+    quantization: "fp32",
+    taskType: "text-to-speech",
+  },
+
+  // Speech-to-Text Models
+  "onnx-community/moonshine-base-ONNX": {
+    repository: "onnx-community/moonshine-base-ONNX",
+    quantization: "fp16",
+    taskType: "speech-to-text",
+  },
+  "onnx-community/whisper-tiny.en": {
+    repository: "onnx-community/whisper-tiny.en",
+    quantization: "q8",
+    taskType: "speech-to-text",
+  }
+}
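
Because modelCatalog is keyed by the SupportedModelsType union, lookups on known model IDs are checked at compile time. A short usage sketch (the modelsForTask helper is illustrative, not part of the commit):

import { modelCatalog, Model } from './Models';

// Typed lookup: a typo in the model ID is a compile-time error.
const kokoro: Model = modelCatalog['onnx-community/Kokoro-82M-v1.0-ONNX'];
console.log(kokoro.taskType);     // "text-to-speech"
console.log(kokoro.quantization); // "fp32"

// Illustrative helper: list every catalog entry for a given task.
function modelsForTask(task: Model['taskType']): Model[] {
  return Object.values(modelCatalog).filter((m) => m.taskType === task);
}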
