Get Evaluation Results
To get evaluation results as a JSON response, send a GET
request to the /evaluation/jobs/<job-id>/results
endpoint, replacing <job-id> with the ID of the evaluation job, as shown in the following examples.
To Get Evaluation Results
Choose one of the following options to get evaluation results: the Python SDK or a direct curl request.
import os
from nemo_microservices import NeMoMicroservices
# Initialize the client
client = NeMoMicroservices(
base_url=os.environ['EVALUATOR_BASE_URL']
)
# Get job results
results = client.evaluation.jobs.results("job-id")
# Access the results
print(f"Result ID: {results.id}")
print(f"Job ID: {results.job}")
print(f"Tasks: {results.tasks}")
print(f"Groups: {results.groups}")
curl -X "GET" "${EVALUATOR_BASE_URL}/evaluation/jobs/<job-id>/results" \
-H 'accept: application/json'
Example Response
{
"created_at": "2025-03-19T22:53:43.619932",
"updated_at": "2025-03-19T22:53:43.619934",
"id": "evaluation_result-1234ABCD5678EFGH",
"job": "eval-UVW123XYZ456",
"tasks": {
"exact_match": {
"metrics": {
"exact_match": {
"scores": {
"gsm8k-metric_ranking-1": {
"value": 0.0
},
"gsm8k-metric_ranking-3": {
"value": 0.8
}
}
}
}
},
"exact_match_stderr": {
"metrics": {
"exact_match_stderr": {
"scores": {
"gsm8k-metric_ranking-2": {
"value": 0.0
},
"gsm8k-metric_ranking-4": {
"value": 0.19999999999999998
}
}
}
}
}
},
"groups": {
"evaluation": {
"metrics": {
"evaluation": {
"scores": {
"exact_match": {
"value": 0.4
},
"exact_match_stderr": {
"value": 0.09999999999999999
}
}
}
}
}
},
"namespace": "default",
"custom_fields": {}
}