diff --git a/pyproject.toml b/pyproject.toml index 36b6a33..6890fb5 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -21,6 +21,7 @@ dependencies = [ "numpy>=1.24.0", "torch>=2.4.0", "transformers>=4.40.0", + "bitsandbytes>=0.46.1", "accelerate>=0.26.0", "huggingface-hub>=0.23.0", "datasets>=2.14.0", @@ -32,6 +33,13 @@ dependencies = [ "wonderwords>=2.2.0", "openai>=1.0.0", "tiktoken>=0.7.0", + "python-dotenv>=1.0.0", + "auto-gptq>=0.5.0", + "optimum>=1.16.0", + "mamba-ssm>=1.0.0", + "compressed-tensors>=0.1.0", + "mlx>=0.10.0", + "mlx-lm>=0.10.0", ] [project.optional-dependencies] diff --git a/src/llm_dna/models/ModelLoader.py b/src/llm_dna/models/ModelLoader.py index f3c8b65..b2c52ee 100644 --- a/src/llm_dna/models/ModelLoader.py +++ b/src/llm_dna/models/ModelLoader.py @@ -82,7 +82,9 @@ def _detect_model_type(self, model_path_or_name: str) -> str: "cohere/command", "perplexity/", ] - if any(model_lower.startswith(prefix) for prefix in openrouter_prefixes): + huggingface_prefixes_openai = "openai/gpt-oss" + + if any(model_lower.startswith(prefix) for prefix in openrouter_prefixes) and not model_lower.startswith(huggingface_prefixes_openai): return "openrouter" # Check for Google Gemini model names