Class: Aws::Bedrock::Types::RFTHyperParameters

Inherits:
Struct
  • Object
show all
Includes:
Structure
Defined in:
lib/aws-sdk-bedrock/types.rb

Overview

Hyperparameters for controlling the reinforcement fine-tuning training process, including learning settings and evaluation intervals.

Constant Summary collapse

SENSITIVE =
[]

Instance Attribute Summary collapse

Instance Attribute Details

#batch_size ⇒ Integer

Number of training samples processed in each batch during reinforcement fine-tuning (RFT) training. Larger batches may improve training stability.

Returns:

  • (Integer)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#epoch_count ⇒ Integer

Number of training epochs to run during reinforcement fine-tuning. Higher values may improve performance but increase training time.

Returns:

  • (Integer)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#eval_interval ⇒ Integer

Interval between evaluation runs during RFT training, measured in training steps. More frequent evaluation provides better monitoring.

Returns:

  • (Integer)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#inference_max_tokens ⇒ Integer

Maximum number of tokens the model can generate in response to each prompt during RFT training.

Returns:

  • (Integer)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#learning_rate ⇒ Float

Learning rate for reinforcement fine-tuning. Controls how quickly the model adapts to reward signals.

Returns:

  • (Float)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#max_prompt_length ⇒ Integer

Maximum length of input prompts during RFT training, measured in tokens. Longer prompts allow more context but increase memory usage and training time.

Returns:

  • (Integer)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#reasoning_effort ⇒ String

Level of reasoning effort applied during RFT training. Higher values may improve response quality but increase training time.

Returns:

  • (String)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end

#training_sample_per_prompt ⇒ Integer

Number of response samples generated per prompt during RFT training. More samples provide better reward signal estimation.

Returns:

  • (Integer)


11525
11526
11527
11528
11529
11530
11531
11532
11533
11534
11535
11536
# File 'lib/aws-sdk-bedrock/types.rb', line 11525

# Hyperparameters for the reinforcement fine-tuning (RFT) training process.
class RFTHyperParameters < Struct.new(
  *%i[
    epoch_count batch_size learning_rate max_prompt_length
    training_sample_per_prompt inference_max_tokens
    reasoning_effort eval_interval
  ]
)
  # Empty array; presumably the members to treat as sensitive (none here).
  SENSITIVE = []
  include Aws::Structure
end