File tree Expand file tree Collapse file tree 1 file changed +3
-59
lines changed
Expand file tree Collapse file tree 1 file changed +3
-59
lines changed Original file line number Diff line number Diff line change @@ -7462,6 +7462,7 @@ components:
74627462 RL.CrossEntropyLossParams :
74637463 type : object
74647464 description : Cross-entropy loss parameters (currently empty).
7465+ properties : {}
74657466 RL.GRPOLossParams :
74667467 type : object
74677468 properties :
@@ -7596,61 +7597,6 @@ components:
75967597 description : Per-token loss mask (1=compute loss, 0=ignore)
75977598 grpo_inputs :
75987599 $ref : '#/components/schemas/RL.GRPOLossInputs'
7599- RL.LossFn :
7600- type : string
7601- default : LOSS_FN_UNSPECIFIED
7602- enum :
7603- - LOSS_FN_UNSPECIFIED
7604- - LOSS_FN_GRPO
7605- RL.LossFnInputs :
7606- type : object
7607- required :
7608- - weights
7609- - target_tokens
7610- properties :
7611- weights :
7612- $ref : ' #/components/schemas/RL.LossFnWeights'
7613- description : Per-token weights
7614- target_tokens :
7615- $ref : ' #/components/schemas/RL.LossFnTargetTokens'
7616- description : Target tokens for loss computation
7617- RL.LossFnTargetTokens :
7618- type : object
7619- required :
7620- - data
7621- properties :
7622- data :
7623- description : Integer array of target tokens
7624- type : array
7625- example :
7626- - 123
7627- - 456
7628- - 789
7629- items :
7630- type : number
7631- dtype :
7632- description : Data type of the integer array
7633- $ref : ' #/components/schemas/RL.DType'
7634- example : D_TYPE_INT64
7635- RL.LossFnWeights :
7636- type : object
7637- required :
7638- - data
7639- properties :
7640- data :
7641- description : Float array of per-token weights
7642- type : array
7643- example :
7644- - 0.1
7645- - 0.2
7646- - 0.3
7647- items :
7648- type : number
7649- format : float
7650- dtype :
7651- description : Data type of the float array
7652- $ref : ' #/components/schemas/RL.DType'
7653- example : D_TYPE_FLOAT32
76547600 RL.TrainingSample :
76557601 type : object
76567602 required :
@@ -7718,8 +7664,7 @@ components:
77187664 - 456
77197665 - 789
77207666 items :
7721- type : string
7722- format : int64
7667+ type : integer
77237668 description : Generated token IDs
77247669 logprobs :
77257670 type : array
@@ -7728,8 +7673,7 @@ components:
77287673 - -1.2
77297674 - -0.3
77307675 items :
7731- type : number
7732- format : double
7676+ type : number
77337677 description : Log probabilities for each generated token
77347678 stop_reason :
77357679 type : string
You can’t perform that action at this time.
0 commit comments