Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 4 additions & 1 deletion openapi.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7789,6 +7789,7 @@ components:
- GRPO_LOSS_AGGREGATION_TYPE_UNSPECIFIED
- GRPO_LOSS_AGGREGATION_TYPE_FIXED_HORIZON
- GRPO_LOSS_AGGREGATION_TYPE_TOKEN_MEAN
- GRPO_LOSS_AGGREGATION_TYPE_SEQUENCE_MEAN
default: GRPO_LOSS_AGGREGATION_TYPE_UNSPECIFIED
RL.LossConfig:
type: object
Expand Down Expand Up @@ -7900,12 +7901,14 @@ components:
properties:
target_tokens:
$ref: '#/components/schemas/RL.LossTargetTokens'
description: Target tokens for loss computation (optional, defaults to shifted input_ids)
description: Target tokens for loss computation
loss_mask:
$ref: '#/components/schemas/RL.LossMask'
description: Per-token loss mask (1=compute loss, 0=ignore)
grpo_inputs:
$ref: '#/components/schemas/RL.GRPOLossInputs'
required:
- target_tokens
RL.TrainingSample:
type: object
required:
Expand Down
Loading