Class: Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig

Inherits:
Object
  • Object
show all
Extended by:
Protobuf::MessageExts::ClassMethods
Includes:
Protobuf::MessageExts
Defined in:
proto_docs/google/cloud/aiplatform/v1/content.rb

Overview

The configuration for routing the request to a specific model.

Defined Under Namespace

Classes: AutoRoutingMode, ManualRoutingMode

Instance Attribute Summary collapse

Instance Attribute Details

#auto_mode::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode

Returns the automated routing configuration.

Note: The following fields are mutually exclusive: auto_mode, manual_mode. If a field in that set is populated, all other fields in the set will automatically be cleared.

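Returns:

  • (::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode) — Automated routing.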



209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
# File 'proto_docs/google/cloud/aiplatform/v1/content.rb', line 209

# The configuration for routing the request to a specific model.
#
# Two routing modes are modelled as nested message classes:
# {AutoRoutingMode} (carried by the `auto_mode` field) and
# {ManualRoutingMode} (carried by the `manual_mode` field). The two fields
# are mutually exclusive: populating one automatically clears the other.
class RoutingConfig
  # Mix in the protobuf message behaviour: instance-side extensions via
  # `include`, class-side helpers via `extend`.
  include ::Google::Protobuf::MessageExts
  extend ::Google::Protobuf::MessageExts::ClassMethods

  # When automated routing is specified, the routing will be determined by
  # the pretrained routing model and customer provided model routing
  # preference.
  # @!attribute [rw] model_routing_preference
  #   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode::ModelRoutingPreference]
  #     The model routing preference.
  class AutoRoutingMode
    # Same protobuf message mixins as the enclosing class. No accessor is
    # written out in this body; `model_routing_preference` is declared only
    # through the YARD `@!attribute` directive above.
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods

    # The model routing preference.
    #
    # Each preference is exposed as an Integer constant (0 through 3).
    module ModelRoutingPreference
      # Unspecified model routing preference.
      UNKNOWN = 0

      # Prefer higher quality over low cost.
      PRIORITIZE_QUALITY = 1

      # Balanced model routing preference.
      BALANCED = 2

      # Prefer lower cost over higher quality.
      PRIORITIZE_COST = 3
    end
  end

  # When manual routing is set, the specified model will be used directly.
  # @!attribute [rw] model_name
  #   @return [::String]
  #     The model name to use. Only the public LLM models are accepted. e.g.
  #     'gemini-1.5-pro-001'.
  class ManualRoutingMode
    # Same protobuf message mixins as the enclosing class. No accessor is
    # written out in this body; `model_name` is declared only through the
    # YARD `@!attribute` directive above.
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods
  end
end

#manual_mode::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode

Returns the manual routing configuration.

Note: The following fields are mutually exclusive: manual_mode, auto_mode. If a field in that set is populated, all other fields in the set will automatically be cleared.

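Returns:

  • (::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode) — Manual routing.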



209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
# File 'proto_docs/google/cloud/aiplatform/v1/content.rb', line 209

# The configuration for routing the request to a specific model.
#
# Two routing modes are modelled as nested message classes:
# {AutoRoutingMode} (carried by the `auto_mode` field) and
# {ManualRoutingMode} (carried by the `manual_mode` field). The two fields
# are mutually exclusive: populating one automatically clears the other.
class RoutingConfig
  # Mix in the protobuf message behaviour: instance-side extensions via
  # `include`, class-side helpers via `extend`.
  include ::Google::Protobuf::MessageExts
  extend ::Google::Protobuf::MessageExts::ClassMethods

  # When automated routing is specified, the routing will be determined by
  # the pretrained routing model and customer provided model routing
  # preference.
  # @!attribute [rw] model_routing_preference
  #   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode::ModelRoutingPreference]
  #     The model routing preference.
  class AutoRoutingMode
    # Same protobuf message mixins as the enclosing class. No accessor is
    # written out in this body; `model_routing_preference` is declared only
    # through the YARD `@!attribute` directive above.
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods

    # The model routing preference.
    #
    # Each preference is exposed as an Integer constant (0 through 3).
    module ModelRoutingPreference
      # Unspecified model routing preference.
      UNKNOWN = 0

      # Prefer higher quality over low cost.
      PRIORITIZE_QUALITY = 1

      # Balanced model routing preference.
      BALANCED = 2

      # Prefer lower cost over higher quality.
      PRIORITIZE_COST = 3
    end
  end

  # When manual routing is set, the specified model will be used directly.
  # @!attribute [rw] model_name
  #   @return [::String]
  #     The model name to use. Only the public LLM models are accepted. e.g.
  #     'gemini-1.5-pro-001'.
  class ManualRoutingMode
    # Same protobuf message mixins as the enclosing class. No accessor is
    # written out in this body; `model_name` is declared only through the
    # YARD `@!attribute` directive above.
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods
  end
end