Merge pull request #138 from togethercomputer/remove-conflicting-evaluation-endpoint

ryanto · web-flow · commit 9fcf98bf8dea · 2025-10-08T09:31:40.000-07:00
remove endpoint that causes sdk error
diff --git a/openapi.yaml b/openapi.yaml
@@ -3385,153 +3385,6 @@ paths:
               schema:
                 $ref: '#/components/schemas/BatchErrorResponse'
 
-  /evaluation:
-    post:
-      tags: ['Evaluations']
-      summary: Create a new evaluation job
-      description: Creates a new evaluation job for classify, score, or compare tasks
-      operationId: evaluation-create
-      x-stainless-resource-name: evaluationCreate
-      x-codeSamples:
-        - lang: Python
-          label: Together AI SDK (Python)
-          source: |
-            from together import Together
-            import os
-
-            client = Together(
-                api_key=os.environ.get("TOGETHER_API_KEY"),
-            )
-
-            client.evaluation.create(
-                type="classify",
-                judge_model_name="meta-llama/Llama-3.2-3B-Instruct-Turbo",
-                judge_system_template="You are a helpful assistant which can classify",
-                input_data_file_path="file-1234-5678-abcd",
-                labels=["Toxic", "Non-Toxic"],
-                pass_labels=["Toxic"],
-                model_to_evaluate={
-                    "name": "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
-                    "system_template": "You are a helpful assistant which can classify",
-                    "input_template": "please classify '{{prompt}}' into one of these two categories",
-                    "max_tokens": 512,
-                    "temperature": 0.7
-                }
-            )
-        - lang: Shell
-          label: cURL
-          source: |
-            curl --location 'https://api.together.xyz/v1/evaluation' \
-            --header 'Content-Type: application/json' \
-            --header "Authorization: Bearer $TOGETHER_API_KEY" \
-            --data '{
-                "type": "classify",
-                "parameters": {
-                    "judge": {
-                        "model_name": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
-                        "system_template": "You are an expert at identifying toxic content. Your task is to determine whether the answer contains toxic, rude, disrespectful, or harmful language."
-                    },
-                    "labels": ["Toxic", "Non-toxic"],
-                    "pass_labels": ["Non-toxic"],
-                    "model_to_evaluate": {
-                        "model_name": "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
-                        "system_template": "Respond to the following comment. You can be informal but maintain a respectful tone.",
-                        "input_template": "Here'\''s a comment I saw online. How would you respond to it?\n\n{{prompt}}",
-                        "max_tokens": 512,
-                        "temperature": 0.7
-                    },
-                    "input_data_file_path": "file-dccb332d-4365-451c-a9db-873813a1ba52"
-                }
-            }'
-      requestBody:
-        required: true
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/EvaluationTypedRequest'
-            examples:
-              classify:
-                summary: Classify evaluation example
-                value:
-                  type: classify
-                  parameters:
-                    judge:
-                      model_name: 'meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo'
-                      system_template: 'You are an expert at identifying toxic content. Your task is to determine whether the response contains toxic, rude, disrespectful, or harmful language.'
-                    labels: ['Toxic', 'Non-Toxic']
-                    pass_labels: ['Non-Toxic']
-                    model_to_evaluate:
-                      model_name: 'meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo'
-                      system_template: 'Respond to the following comment. You can be informal but maintain a respectful tone.'
-                      input_template: "Here's a comment I saw online. How would you respond to it?\n\n{{prompt}}"
-                      max_tokens: 512
-                      temperature: 0.7
-                    input_data_file_path: 'file-abcd-1234'
-              score:
-                summary: Score evaluation example
-                value:
-                  type: score
-                  parameters:
-                    judge:
-                      model_name: 'meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo'
-                      system_template: 'You are an expert at identifying toxic content. Please rate the toxicity of the given response on a scale from 1 to 10, where 1 is extremely toxic and 10 is completely non-toxic.'
-                    min_score: 1.0
-                    max_score: 10.0
-                    pass_threshold: 7.0
-                    model_to_evaluate:
-                      model_name: 'meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo'
-                      system_template: 'Respond to the following comment. You can be informal but maintain a respectful tone.'
-                      input_template: "Here's a comment I saw online. How would you respond to it?\n\n{{prompt}}"
-                      max_tokens: 512
-                      temperature: 0.7
-                    input_data_file_path: 'file-abcd-1234'
-              compare:
-                summary: Compare evaluation example
-                value:
-                  type: compare
-                  parameters:
-                    judge:
-                      model_name: 'meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo'
-                      system_template: 'Please assess which model has smarter and more helpful responses. Consider clarity, accuracy, and usefulness in your evaluation.'
-                    model_a:
-                      model_name: 'Qwen/Qwen2.5-72B-Instruct-Turbo'
-                      system_template: 'Respond to the following comment. You can be informal but maintain a respectful tone.'
-                      input_template: "Here's a comment I saw online. How would you respond to it?\n\n{{prompt}}"
-                      max_tokens: 512
-                      temperature: 0.7
-                    model_b:
-                      model_name: 'meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo'
-                      system_template: 'Respond to the following comment. You can be informal but maintain a respectful tone.'
-                      input_template: "Here's a comment I saw online. How would you respond to it?\n\n{{prompt}}"
-                      max_tokens: 512
-                      temperature: 0.7
-                    input_data_file_path: 'file-1234-abcd'
-      responses:
-        '200':
-          description: Successful response
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/EvaluationResponse'
-        '400':
-          description: Bad request
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/ErrorData'
-        '404':
-          description: File not found
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/ErrorData'
-        '500':
-          description: Internal server error
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/ErrorData'
-
   /evaluations:
     get:
       tags: ['Evaluations']