@@ -7617,11 +7617,14 @@ components:
76177617 RL.SampleBody :
76187618 type : object
76197619 required :
7620- - prompt
7620+ - prompts
76217621 properties :
7622- prompt :
7623- $ref : ' #/components/schemas/RL.ModelInput'
7624- description : Input prompt as tokenized chunks
7622+ prompts :
7623+ description : Input prompts, each given as tokenized chunks
7624+ type : array
7625+ items :
7626+ type : object
7627+ $ref : ' #/components/schemas/RL.ModelInput'
76257628 sampling_params :
76267629 $ref : ' #/components/schemas/RL.SamplingParams'
76277630 description : Optional sampling parameters
@@ -7630,7 +7633,7 @@ components:
76307633 format : int64
76317634 example : 1
76327635 default : " 1"
7633- description : Number of completions to generate for this prompt
7636+ description : Number of completions to generate per prompt
76347637 RL.ForwardBackwardBody :
76357638 type : object
76367639 required :
@@ -7714,6 +7717,10 @@ components:
77147717 type : boolean
77157718 example : true
77167719 description : Whether more items exist beyond this page
7720+ next_cursor :
7721+ type : string
7722+ example : 123e4567-e89b-12d3-a456-426614174000
7723+ description : Cursor to use as the 'after' parameter for the next page. Empty when has_more is false.
77177724 RL.EncodedText :
77187725 type : object
77197726 properties :
@@ -7943,14 +7950,23 @@ components:
79437950 format : uint64
79447951 example : 100
79457952 RL.SampleResult :
7953+ type : object
7954+ properties :
7955+ rollouts :
7956+ type : array
7957+ items :
7958+ type : object
7959+ $ref : ' #/components/schemas/RL.SampleRollout'
7960+ description : Rollouts, each holding the completions generated for one prompt
7961+ RL.SampleRollout :
79467962 type : object
79477963 properties :
79487964 sequences :
79497965 type : array
79507966 items :
79517967 type : object
79527968 $ref : ' #/components/schemas/RL.SampleSequence'
7953- description : Generated completions
7969+ description : Completions generated for one prompt
79547970 RL.SampleSequence :
79557971 type : object
79567972 properties :
@@ -7998,11 +8014,15 @@ components:
79988014 properties :
79998015 loss :
80008016 type : number
8017+ format : double
80018018 example : 2.345
80028019 description : Loss value
80038020 metrics :
80048021 type : object
80058022 description : Loss-specific metrics (e.g., KL divergence, clip fraction for GRPO)
8023+ example :
8024+ loss/clip/high_fraction : 0.1
8025+ loss/kl_ref/mean : 0.05
80068026 additionalProperties :
80078027 type : number
80088028 format : double
0 commit comments