Implement largest tag as alias

ldmosquera · ldmosquera · commit 18978b534f34 · 2025-03-25T11:43:18.000-03:00
diff --git a/lib/ruby_llm/aliases.rb b/lib/ruby_llm/aliases.rb
@@ -19,13 +19,11 @@ class << self
       # @param provider_slug [String, Symbol, nil] optional provider to resolve for
       # @return [String] the resolved model ID or the original if no alias exists
       def resolve(model_id, provider = nil)
-        return model_id unless aliases[model_id]
-
         if provider
-          aliases[model_id][provider.to_s] || model_id
+          @runtime_aliases&.dig(provider.to_s, model_id) || aliases.dig(model_id, provider.to_s) || model_id
         else
           # Get native provider's version
-          aliases[model_id].values.first || model_id
+          aliases[model_id]&.values&.first || model_id
         end
       end
 
@@ -35,6 +33,14 @@ def aliases
         @aliases ||= load_aliases
       end
 
+      # Stores runtime-only aliases for a provider (replaces its previous set; not persisted across restarts)
+      # @param provider [#to_s] provider slug; the aliases are keyed by its string form
+      # @param extra_aliases [Hash] aliases to store for that provider
+      # @return [Hash] the extra_aliases hash that was stored
+      def register_runtime_aliases(provider, extra_aliases)
+        (@runtime_aliases ||= {})[provider.to_s] = extra_aliases
+      end
+
       # Loads aliases from the JSON file
       # @return [Hash] the loaded aliases
       def load_aliases
diff --git a/lib/ruby_llm/providers/ollama/models.rb b/lib/ruby_llm/providers/ollama/models.rb
@@ -10,13 +10,6 @@ def models_url
           'api/tags'
         end
 
-        # FIXME: include aliases for tags with the format \d+m or \d+b
-        # ie. given these models in the server,
-        # - gemma3:27b
-        # - gemma3:9b
-        #
-        # create an alias gemma3 for gemma3:27b
-
         # NOTE: Unlike other providers for well known APIs with stable model
         # offerings, the Ollama provider deals with local servers which
         # might have arbitrarily named models or even zero models installed.
@@ -38,7 +31,28 @@ def list_models
         private
 
         def parse_list_models_response(response, slug, capabilities) # rubocop:disable Metrics/MethodLength
-          (response.body['models'] || []).map do |model|
+          provider_aliases = {}
+          list = response.body['models'] || []
+
+          # initial pass: discover Ollama "tags"
+          list.each do |model|
+            base, tag = model['name'].split(':', 2)
+            model['model_name_base'] = base if tag
+          end
+
+          # second pass: alias each base name to its largest model; untagged names all group under nil
+          list.group_by { |m| m['model_name_base'] }.each do |base, models|
+            # given these models in the server,
+            # - gemma3:27b
+            # - gemma3:9b
+            # then gemma3:27b will get the 'gemma3' alias since the 27b is larger in bytesize
+            largest = models.max_by { |m| m['size'].to_i }
+            provider_aliases[base] = largest['name']
+          end
+          RubyLLM::Aliases.register_runtime_aliases(slug, provider_aliases)
+
+          # final pass: assemble
+          list.map do |model|
             model_id = model['name']
 
             ModelInfo.new(
@@ -57,6 +71,7 @@ def parse_list_models_response(response, slug, capabilities) # rubocop:disable M
               input_price_per_million: capabilities.input_price_for(model_id),
               output_price_per_million: capabilities.output_price_for(model_id),
               metadata: {
+                model_name_base: model['model_name_base'],
                 byte_size: model['size']&.to_i,
                 parameter_size: model.dig('details', 'parameter_size'),
                 quantization_level: model.dig('details', 'quantization_level'),
diff --git a/spec/ruby_llm/providers/ollama/ollama_spec.rb b/spec/ruby_llm/providers/ollama/ollama_spec.rb
@@ -31,6 +31,11 @@
         an_object_having_attributes(provider: 'ollama', id: 'snowflake-arctic-embed:22m')
       )
     end
+
+    it 'aliases models to the largest available tag' do
+      # the bare name 'smollm' carries no tag; it is expected to come back as a full tagged id
+      expect(RubyLLM.chat(model: 'smollm', provider: 'ollama').model.id).to eq('smollm:135m')
+    end
   end
 
   describe '.chat' do