Class: Aws::Bedrock::Types::RFTHyperParameters

Inherits:

Struct

Object
Struct
Aws::Bedrock::Types::RFTHyperParameters

show all

Includes: Structure

Defined in: lib/aws-sdk-bedrock/types.rb

Overview

Hyperparameters for controlling the reinforcement fine-tuning training process, including learning settings and evaluation intervals.

Constant Summary collapse

SENSITIVE =

[]

Instance Attribute Summary collapse

#batch_size ⇒ Integer

Number of training samples processed in each batch during reinforcement fine-tuning (RFT) training.
#epoch_count ⇒ Integer

Number of training epochs to run during reinforcement fine-tuning.
#eval_interval ⇒ Integer

Interval between evaluation runs during RFT training, measured in training steps.
#inference_max_tokens ⇒ Integer

Maximum number of tokens the model can generate in response to each prompt during RFT training.
#learning_rate ⇒ Float

Learning rate for the reinforcement fine-tuning.
#max_prompt_length ⇒ Integer

Maximum length of input prompts during RFT training, measured in tokens.
#reasoning_effort ⇒ String

Level of reasoning effort applied during RFT training.
#training_sample_per_prompt ⇒ Integer

Number of response samples generated per prompt during RFT training.

Instance Attribute Details

#batch_size ⇒ `Integer`

Number of training samples processed in each batch during reinforcement fine-tuning (RFT) training. Larger batches may improve training stability.

Returns:

(Integer)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#epoch_count ⇒ `Integer`

Number of training epochs to run during reinforcement fine-tuning. Higher values may improve performance but increase training time.

Returns:

(Integer)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#eval_interval ⇒ `Integer`

Interval between evaluation runs during RFT training, measured in training steps. More frequent evaluation provides better monitoring.

Returns:

(Integer)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#inference_max_tokens ⇒ `Integer`

Maximum number of tokens the model can generate in response to each prompt during RFT training.

Returns:

(Integer)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#learning_rate ⇒ `Float`

Learning rate for the reinforcement fine-tuning. Controls how quickly the model adapts to reward signals.

Returns:

(Float)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#max_prompt_length ⇒ `Integer`

Maximum length of input prompts during RFT training, measured in tokens. Longer prompts allow more context but increase memory usage and training time.

Returns:

(Integer)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#reasoning_effort ⇒ `String`

Level of reasoning effort applied during RFT training. Higher values may improve response quality but increase training time.

Returns:

(String)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

#training_sample_per_prompt ⇒ `Integer`

Number of response samples generated per prompt during RFT training. More samples provide better reward signal estimation.

Returns:

(Integer)

# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for controlling the reinforcement fine-tuning (RFT)
# training process, including learning settings and evaluation intervals.
#
# The symbols passed to Struct.new define the struct's members and their
# order, so the list must not be reordered.
#
# @!attribute [rw] epoch_count
#   @return [Integer] number of training epochs to run
# @!attribute [rw] batch_size
#   @return [Integer] number of training samples processed in each batch
# @!attribute [rw] learning_rate
#   @return [Float] learning rate for the fine-tuning
# @!attribute [rw] max_prompt_length
#   @return [Integer] maximum length of input prompts, measured in tokens
# @!attribute [rw] training_sample_per_prompt
#   @return [Integer] number of response samples generated per prompt
# @!attribute [rw] inference_max_tokens
#   @return [Integer] maximum number of tokens generated per prompt response
# @!attribute [rw] reasoning_effort
#   @return [String] level of reasoning effort applied during training
# @!attribute [rw] eval_interval
#   @return [Integer] interval between evaluation runs, in training steps
class RFTHyperParameters < Struct.new(
  :epoch_count,
  :batch_size,
  :learning_rate,
  :max_prompt_length,
  :training_sample_per_prompt,
  :inference_max_tokens,
  :reasoning_effort,
  :eval_interval)
  # NOTE(review): presumably lists members whose values should be hidden when
  # the struct is inspected or logged; it is empty here. Confirm against
  # Aws::Structure, which is not visible in this excerpt.
  SENSITIVE = []
  # Mixes in Aws::Structure (defined outside this excerpt).
  include Aws::Structure
end

Class: Aws::Bedrock::Types::RFTHyperParameters

Overview

Constant Summary collapse

Instance Attribute Summary collapse

Instance Attribute Details

#batch_size ⇒ Integer

#epoch_count ⇒ Integer

#eval_interval ⇒ Integer

#inference_max_tokens ⇒ Integer

#learning_rate ⇒ Float

#max_prompt_length ⇒ Integer

#reasoning_effort ⇒ String

#training_sample_per_prompt ⇒ Integer

#batch_size ⇒ `Integer`

#epoch_count ⇒ `Integer`

#eval_interval ⇒ `Integer`

#inference_max_tokens ⇒ `Integer`

#learning_rate ⇒ `Float`

#max_prompt_length ⇒ `Integer`

#reasoning_effort ⇒ `String`

#training_sample_per_prompt ⇒ `Integer`