Class: Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig

Inherits:
Object
Extended by:
Google::Protobuf::MessageExts::ClassMethods
Includes:
Google::Protobuf::MessageExts
Defined in:
proto_docs/google/cloud/aiplatform/v1/content.rb

Overview

The configuration for routing the request to a specific model.

Defined Under Namespace

Classes: AutoRoutingMode, ManualRoutingMode

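Instance Attribute Summary

  • #auto_mode ⇒ ::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode — Automated routing.
  • #manual_mode ⇒ ::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode — Manual routing.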

Instance Attribute Details

#auto_mode ⇒ ::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode

Returns the automated routing mode.

Note: The following fields are mutually exclusive: auto_mode, manual_mode. If a field in that set is populated, all other fields in the set will automatically be cleared.

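Returns:

  • (::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode) — Automated routing.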



361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
# File 'proto_docs/google/cloud/aiplatform/v1/content.rb', line 361

# The configuration for routing the request to a specific model.
# @!attribute [rw] auto_mode
#   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode]
#     Automated routing.
#
#     Note: The following fields are mutually exclusive: `auto_mode`, `manual_mode`.
#     If a field in that set is populated, all other fields in the set will
#     automatically be cleared.
# @!attribute [rw] manual_mode
#   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode]
#     Manual routing.
#
#     Note: The following fields are mutually exclusive: `manual_mode`, `auto_mode`.
#     If a field in that set is populated, all other fields in the set will
#     automatically be cleared.
class RoutingConfig
  # No accessor methods are defined in this body; the attributes are declared
  # for documentation only, through the YARD `@!attribute` directives.
  # NOTE(review): presumably the fields themselves are supplied by the
  # protobuf runtime via these mixins - confirm against the generated
  # message descriptor.
  include ::Google::Protobuf::MessageExts
  extend ::Google::Protobuf::MessageExts::ClassMethods

  # When automated routing is specified, the routing will be determined by
  # the pretrained routing model and the customer-provided model routing
  # preference.
  # @!attribute [rw] model_routing_preference
  #   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode::ModelRoutingPreference]
  #     The model routing preference.
  class AutoRoutingMode
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods

    # The model routing preference. Each constant below is the integer value
    # of one preference.
    module ModelRoutingPreference
      # Unspecified model routing preference.
      UNKNOWN = 0

      # Prefer higher quality over lower cost.
      PRIORITIZE_QUALITY = 1

      # Balanced model routing preference.
      BALANCED = 2

      # Prefer lower cost over higher quality.
      PRIORITIZE_COST = 3
    end
  end

  # When manual routing is set, the specified model will be used directly.
  # @!attribute [rw] model_name
  #   @return [::String]
  #     The model name to use. Only the public LLM models are accepted, e.g.
  #     'gemini-1.5-pro-001'.
  class ManualRoutingMode
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods
  end
end

#manual_mode ⇒ ::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode

Returns the manual routing mode.

Note: The following fields are mutually exclusive: manual_mode, auto_mode. If a field in that set is populated, all other fields in the set will automatically be cleared.

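Returns:

  • (::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode) — Manual routing.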



361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
# File 'proto_docs/google/cloud/aiplatform/v1/content.rb', line 361

# The configuration for routing the request to a specific model.
# @!attribute [rw] auto_mode
#   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode]
#     Automated routing.
#
#     Note: The following fields are mutually exclusive: `auto_mode`, `manual_mode`.
#     If a field in that set is populated, all other fields in the set will
#     automatically be cleared.
# @!attribute [rw] manual_mode
#   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::ManualRoutingMode]
#     Manual routing.
#
#     Note: The following fields are mutually exclusive: `manual_mode`, `auto_mode`.
#     If a field in that set is populated, all other fields in the set will
#     automatically be cleared.
class RoutingConfig
  # No accessor methods are defined in this body; the attributes are declared
  # for documentation only, through the YARD `@!attribute` directives.
  # NOTE(review): presumably the fields themselves are supplied by the
  # protobuf runtime via these mixins - confirm against the generated
  # message descriptor.
  include ::Google::Protobuf::MessageExts
  extend ::Google::Protobuf::MessageExts::ClassMethods

  # When automated routing is specified, the routing will be determined by
  # the pretrained routing model and the customer-provided model routing
  # preference.
  # @!attribute [rw] model_routing_preference
  #   @return [::Google::Cloud::AIPlatform::V1::GenerationConfig::RoutingConfig::AutoRoutingMode::ModelRoutingPreference]
  #     The model routing preference.
  class AutoRoutingMode
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods

    # The model routing preference. Each constant below is the integer value
    # of one preference.
    module ModelRoutingPreference
      # Unspecified model routing preference.
      UNKNOWN = 0

      # Prefer higher quality over lower cost.
      PRIORITIZE_QUALITY = 1

      # Balanced model routing preference.
      BALANCED = 2

      # Prefer lower cost over higher quality.
      PRIORITIZE_COST = 3
    end
  end

  # When manual routing is set, the specified model will be used directly.
  # @!attribute [rw] model_name
  #   @return [::String]
  #     The model name to use. Only the public LLM models are accepted, e.g.
  #     'gemini-1.5-pro-001'.
  class ManualRoutingMode
    include ::Google::Protobuf::MessageExts
    extend ::Google::Protobuf::MessageExts::ClassMethods
  end
end