Requête sur les résultats d’évaluation

# POST an evaluation-results query; the JSON document below is sent as the request body.
curl -X POST \
  https://api.example.com/v2/{entity}/{project}/eval_results/query \
  -H 'Content-Type: application/json' \
  -d '
{
  "evaluation_call_ids": [
    "<string>"
  ],
  "evaluation_run_ids": [
    "<string>"
  ],
  "filter_logic_operator": "or",
  "filters": [
    {
      "query": {
        "$expr": {
          "$and": [
            {
              "$literal": "<string>"
            }
          ]
        }
      },
      "evaluation_call_id": "<string>"
    }
  ],
  "include_costs": false,
  "include_predict_and_score_children": true,
  "include_raw_data_rows": false,
  "include_rows": true,
  "include_summary": false,
  "limit": 123,
  "offset": 0,
  "require_intersection": false,
  "resolve_row_refs": false,
  "sort_by": [
    {
      "field": "<string>",
      "evaluation_call_id": "<string>",
      "mode": "value"
    }
  ],
  "summary_require_intersection": true
}
'

import requests

# Endpoint of the evaluation-results query; {entity} and {project} are path parameters.
url = "https://api.example.com/v2/{entity}/{project}/eval_results/query"

# Single entry of the "filters" list.
filter_entry = {
    "query": {"$expr": {"$and": [{"$literal": "<string>"}]}},
    "evaluation_call_id": "<string>",
}

# Single entry of the "sort_by" list.
sort_entry = {
    "field": "<string>",
    "evaluation_call_id": "<string>",
    "mode": "value",
}

# Full request body; key order matches the serialized JSON order.
payload = {
    "evaluation_call_ids": ["<string>"],
    "evaluation_run_ids": ["<string>"],
    "filter_logic_operator": "or",
    "filters": [filter_entry],
    "include_costs": False,
    "include_predict_and_score_children": True,
    "include_raw_data_rows": False,
    "include_rows": True,
    "include_summary": False,
    "limit": 123,
    "offset": 0,
    "require_intersection": False,
    "resolve_row_refs": False,
    "sort_by": [sort_entry],
    "summary_require_intersection": True,
}

# Send the payload as JSON and print the raw response text.
response = requests.post(
    url,
    json=payload,
    headers={"Content-Type": "application/json"},
)

print(response.text)

// Request body for the evaluation-results query.
const requestBody = {
  evaluation_call_ids: ['<string>'],
  evaluation_run_ids: ['<string>'],
  filter_logic_operator: 'or',
  filters: [
    {
      query: {$expr: {$and: [{$literal: '<string>'}]}},
      evaluation_call_id: '<string>'
    }
  ],
  include_costs: false,
  include_predict_and_score_children: true,
  include_raw_data_rows: false,
  include_rows: true,
  include_summary: false,
  limit: 123,
  offset: 0,
  require_intersection: false,
  resolve_row_refs: false,
  sort_by: [
    {
      field: '<string>',
      evaluation_call_id: '<string>',
      mode: 'value'
    }
  ],
  summary_require_intersection: true
};

const options = {
  method: 'POST',
  headers: {'Content-Type': 'application/json'},
  body: JSON.stringify(requestBody)
};

// Send the request, log the parsed JSON response, and log any failure to stderr.
(async () => {
  try {
    const res = await fetch(
      'https://api.example.com/v2/{entity}/{project}/eval_results/query',
      options
    );
    const parsed = await res.json();
    console.log(parsed);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Request body for the evaluation-results query; JSON-encoded when the cURL options are set.
$payload = [
  'evaluation_call_ids' => ['<string>'],
  'evaluation_run_ids' => ['<string>'],
  'filter_logic_operator' => 'or',
  'filters' => [
    [
      'query' => [
        '$expr' => [
          '$and' => [
            ['$literal' => '<string>'],
          ],
        ],
      ],
      'evaluation_call_id' => '<string>',
    ],
  ],
  'include_costs' => false,
  'include_predict_and_score_children' => true,
  'include_raw_data_rows' => false,
  'include_rows' => true,
  'include_summary' => false,
  'limit' => 123,
  'offset' => 0,
  'require_intersection' => false,
  'resolve_row_refs' => false,
  'sort_by' => [
    [
      'field' => '<string>',
      'evaluation_call_id' => '<string>',
      'mode' => 'value',
    ],
  ],
  'summary_require_intersection' => true,
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.example.com/v2/{entity}/{project}/eval_results/query",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode($payload),
  CURLOPT_HTTPHEADER => ["Content-Type: application/json"],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error message when one was reported, otherwise the raw response.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"io"
	"net/http"
	"strings"
)

// main posts an evaluation-results query and prints the raw response body.
// Every step that can fail is checked; on failure the error is printed and
// the program returns without touching a nil response.
func main() {

	// {entity} and {project} are path parameters of the endpoint.
	url := "https://api.example.com/v2/{entity}/{project}/eval_results/query"

	payload := strings.NewReader("{\n  \"evaluation_call_ids\": [\n    \"<string>\"\n  ],\n  \"evaluation_run_ids\": [\n    \"<string>\"\n  ],\n  \"filter_logic_operator\": \"or\",\n  \"filters\": [\n    {\n      \"query\": {\n        \"$expr\": {\n          \"$and\": [\n            {\n              \"$literal\": \"<string>\"\n            }\n          ]\n        }\n      },\n      \"evaluation_call_id\": \"<string>\"\n    }\n  ],\n  \"include_costs\": false,\n  \"include_predict_and_score_children\": true,\n  \"include_raw_data_rows\": false,\n  \"include_rows\": true,\n  \"include_summary\": false,\n  \"limit\": 123,\n  \"offset\": 0,\n  \"require_intersection\": false,\n  \"resolve_row_refs\": false,\n  \"sort_by\": [\n    {\n      \"field\": \"<string>\",\n      \"evaluation_call_id\": \"<string>\",\n      \"mode\": \"value\"\n    }\n  ],\n  \"summary_require_intersection\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request failed:", err)
		return
	}

	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do returns an error, so res.Body must not be used.
		fmt.Println("request failed:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response failed:", err)
		return
	}

	fmt.Println(string(body))

}

// Endpoint of the evaluation-results query; {entity} and {project} are path parameters.
String endpoint = "https://api.example.com/v2/{entity}/{project}/eval_results/query";

// JSON request body, sent verbatim.
String requestJson = "{\n  \"evaluation_call_ids\": [\n    \"<string>\"\n  ],\n  \"evaluation_run_ids\": [\n    \"<string>\"\n  ],\n  \"filter_logic_operator\": \"or\",\n  \"filters\": [\n    {\n      \"query\": {\n        \"$expr\": {\n          \"$and\": [\n            {\n              \"$literal\": \"<string>\"\n            }\n          ]\n        }\n      },\n      \"evaluation_call_id\": \"<string>\"\n    }\n  ],\n  \"include_costs\": false,\n  \"include_predict_and_score_children\": true,\n  \"include_raw_data_rows\": false,\n  \"include_rows\": true,\n  \"include_summary\": false,\n  \"limit\": 123,\n  \"offset\": 0,\n  \"require_intersection\": false,\n  \"resolve_row_refs\": false,\n  \"sort_by\": [\n    {\n      \"field\": \"<string>\",\n      \"evaluation_call_id\": \"<string>\",\n      \"mode\": \"value\"\n    }\n  ],\n  \"summary_require_intersection\": true\n}";

// POST the body as JSON and read the response as a string.
HttpResponse<String> response = Unirest.post(endpoint)
  .header("Content-Type", "application/json")
  .body(requestJson)
  .asString();

require 'uri'
require 'net/http'

# Endpoint of the evaluation-results query; {entity} and {project} are path parameters.
url = URI("https://api.example.com/v2/{entity}/{project}/eval_results/query")

# Build the POST request with its JSON body, sent verbatim.
request = Net::HTTP::Post.new(url)
request["Content-Type"] = 'application/json'
request.body = "{\n  \"evaluation_call_ids\": [\n    \"<string>\"\n  ],\n  \"evaluation_run_ids\": [\n    \"<string>\"\n  ],\n  \"filter_logic_operator\": \"or\",\n  \"filters\": [\n    {\n      \"query\": {\n        \"$expr\": {\n          \"$and\": [\n            {\n              \"$literal\": \"<string>\"\n            }\n          ]\n        }\n      },\n      \"evaluation_call_id\": \"<string>\"\n    }\n  ],\n  \"include_costs\": false,\n  \"include_predict_and_score_children\": true,\n  \"include_raw_data_rows\": false,\n  \"include_rows\": true,\n  \"include_summary\": false,\n  \"limit\": 123,\n  \"offset\": 0,\n  \"require_intersection\": false,\n  \"resolve_row_refs\": false,\n  \"sort_by\": [\n    {\n      \"field\": \"<string>\",\n      \"evaluation_call_id\": \"<string>\",\n      \"mode\": \"value\"\n    }\n  ],\n  \"summary_require_intersection\": true\n}"

# Open a TLS connection, send the request, and print the response body.
response = Net::HTTP.start(url.host, url.port, use_ssl: true) do |http|
  http.request(request)
end
puts response.read_body

{
  "rows": [
    {
      "row_digest": "<string>",
      "evaluations": [
        {
          "evaluation_call_id": "<string>",
          "trials": [
            {
              "predict_and_score_call_id": "<string>",
              "genai_span_ref": [
                {
                  "span_id": "<string>",
                  "trace_id": "<string>"
                }
              ],
              "model_latency_seconds": 123,
              "model_output": null,
              "predict_call_id": "<string>",
              "scorer_call_ids": {},
              "scores": {},
              "total_cost": 123,
              "total_tokens": 123
            }
          ]
        }
      ],
      "raw_data_row": null
    }
  ],
  "total_rows": 123,
  "summary": {
    "evaluations": [
      {
        "evaluation_call_id": "<string>",
        "display_name": "<string>",
        "evaluation_ref": "<string>",
        "model_ref": "<string>",
        "predict_total_cost": 123,
        "predict_total_tokens": 123,
        "scorer_stats": [
          {
            "scorer_key": "<string>",
            "numeric_count": 0,
            "numeric_mean": 123,
            "pass_known_count": 0,
            "pass_rate": 123,
            "pass_signal_coverage": 123,
            "pass_true_count": 0,
            "path": "<string>",
            "trial_count": 0
          }
        ],
        "started_at": "<string>",
        "trace_id": "<string>",
        "trial_count": 0
      }
    ],
    "row_count": 0
  },
  "warnings": [
    "<string>"
  ]
}

{
  "detail": [
    {
      "loc": [
        "<string>"
      ],
      "msg": "<string>",
      "type": "<string>"
    }
  ]
}

POST

{entity}

{project}

eval_results

query

Requête sur les résultats d’évaluation

# POST an evaluation-results query; the JSON document below is sent as the request body.
curl -X POST \
  https://api.example.com/v2/{entity}/{project}/eval_results/query \
  -H 'Content-Type: application/json' \
  -d '
{
  "evaluation_call_ids": [
    "<string>"
  ],
  "evaluation_run_ids": [
    "<string>"
  ],
  "filter_logic_operator": "or",
  "filters": [
    {
      "query": {
        "$expr": {
          "$and": [
            {
              "$literal": "<string>"
            }
          ]
        }
      },
      "evaluation_call_id": "<string>"
    }
  ],
  "include_costs": false,
  "include_predict_and_score_children": true,
  "include_raw_data_rows": false,
  "include_rows": true,
  "include_summary": false,
  "limit": 123,
  "offset": 0,
  "require_intersection": false,
  "resolve_row_refs": false,
  "sort_by": [
    {
      "field": "<string>",
      "evaluation_call_id": "<string>",
      "mode": "value"
    }
  ],
  "summary_require_intersection": true
}
'

import requests

# Endpoint of the evaluation-results query; {entity} and {project} are path parameters.
url = "https://api.example.com/v2/{entity}/{project}/eval_results/query"

# Single entry of the "filters" list.
filter_entry = {
    "query": {"$expr": {"$and": [{"$literal": "<string>"}]}},
    "evaluation_call_id": "<string>",
}

# Single entry of the "sort_by" list.
sort_entry = {
    "field": "<string>",
    "evaluation_call_id": "<string>",
    "mode": "value",
}

# Full request body; key order matches the serialized JSON order.
payload = {
    "evaluation_call_ids": ["<string>"],
    "evaluation_run_ids": ["<string>"],
    "filter_logic_operator": "or",
    "filters": [filter_entry],
    "include_costs": False,
    "include_predict_and_score_children": True,
    "include_raw_data_rows": False,
    "include_rows": True,
    "include_summary": False,
    "limit": 123,
    "offset": 0,
    "require_intersection": False,
    "resolve_row_refs": False,
    "sort_by": [sort_entry],
    "summary_require_intersection": True,
}

# Send the payload as JSON and print the raw response text.
response = requests.post(
    url,
    json=payload,
    headers={"Content-Type": "application/json"},
)

print(response.text)

// Request body for the evaluation-results query.
const requestBody = {
  evaluation_call_ids: ['<string>'],
  evaluation_run_ids: ['<string>'],
  filter_logic_operator: 'or',
  filters: [
    {
      query: {$expr: {$and: [{$literal: '<string>'}]}},
      evaluation_call_id: '<string>'
    }
  ],
  include_costs: false,
  include_predict_and_score_children: true,
  include_raw_data_rows: false,
  include_rows: true,
  include_summary: false,
  limit: 123,
  offset: 0,
  require_intersection: false,
  resolve_row_refs: false,
  sort_by: [
    {
      field: '<string>',
      evaluation_call_id: '<string>',
      mode: 'value'
    }
  ],
  summary_require_intersection: true
};

const options = {
  method: 'POST',
  headers: {'Content-Type': 'application/json'},
  body: JSON.stringify(requestBody)
};

// Send the request, log the parsed JSON response, and log any failure to stderr.
(async () => {
  try {
    const res = await fetch(
      'https://api.example.com/v2/{entity}/{project}/eval_results/query',
      options
    );
    const parsed = await res.json();
    console.log(parsed);
  } catch (err) {
    console.error(err);
  }
})();

<?php

// Request body for the evaluation-results query; JSON-encoded when the cURL options are set.
$payload = [
  'evaluation_call_ids' => ['<string>'],
  'evaluation_run_ids' => ['<string>'],
  'filter_logic_operator' => 'or',
  'filters' => [
    [
      'query' => [
        '$expr' => [
          '$and' => [
            ['$literal' => '<string>'],
          ],
        ],
      ],
      'evaluation_call_id' => '<string>',
    ],
  ],
  'include_costs' => false,
  'include_predict_and_score_children' => true,
  'include_raw_data_rows' => false,
  'include_rows' => true,
  'include_summary' => false,
  'limit' => 123,
  'offset' => 0,
  'require_intersection' => false,
  'resolve_row_refs' => false,
  'sort_by' => [
    [
      'field' => '<string>',
      'evaluation_call_id' => '<string>',
      'mode' => 'value',
    ],
  ],
  'summary_require_intersection' => true,
];

$curl = curl_init();

curl_setopt_array($curl, [
  CURLOPT_URL => "https://api.example.com/v2/{entity}/{project}/eval_results/query",
  CURLOPT_RETURNTRANSFER => true,
  CURLOPT_ENCODING => "",
  CURLOPT_MAXREDIRS => 10,
  CURLOPT_TIMEOUT => 30,
  CURLOPT_HTTP_VERSION => CURL_HTTP_VERSION_1_1,
  CURLOPT_CUSTOMREQUEST => "POST",
  CURLOPT_POSTFIELDS => json_encode($payload),
  CURLOPT_HTTPHEADER => ["Content-Type: application/json"],
]);

$response = curl_exec($curl);
$err = curl_error($curl);

curl_close($curl);

// Print the cURL error message when one was reported, otherwise the raw response.
echo $err ? "cURL Error #:" . $err : $response;

package main

import (
	"fmt"
	"io"
	"net/http"
	"strings"
)

// main posts an evaluation-results query and prints the raw response body.
// Every step that can fail is checked; on failure the error is printed and
// the program returns without touching a nil response.
func main() {

	// {entity} and {project} are path parameters of the endpoint.
	url := "https://api.example.com/v2/{entity}/{project}/eval_results/query"

	payload := strings.NewReader("{\n  \"evaluation_call_ids\": [\n    \"<string>\"\n  ],\n  \"evaluation_run_ids\": [\n    \"<string>\"\n  ],\n  \"filter_logic_operator\": \"or\",\n  \"filters\": [\n    {\n      \"query\": {\n        \"$expr\": {\n          \"$and\": [\n            {\n              \"$literal\": \"<string>\"\n            }\n          ]\n        }\n      },\n      \"evaluation_call_id\": \"<string>\"\n    }\n  ],\n  \"include_costs\": false,\n  \"include_predict_and_score_children\": true,\n  \"include_raw_data_rows\": false,\n  \"include_rows\": true,\n  \"include_summary\": false,\n  \"limit\": 123,\n  \"offset\": 0,\n  \"require_intersection\": false,\n  \"resolve_row_refs\": false,\n  \"sort_by\": [\n    {\n      \"field\": \"<string>\",\n      \"evaluation_call_id\": \"<string>\",\n      \"mode\": \"value\"\n    }\n  ],\n  \"summary_require_intersection\": true\n}")

	req, err := http.NewRequest("POST", url, payload)
	if err != nil {
		fmt.Println("building request failed:", err)
		return
	}

	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do returns an error, so res.Body must not be used.
		fmt.Println("request failed:", err)
		return
	}
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response failed:", err)
		return
	}

	fmt.Println(string(body))

}

// Endpoint of the evaluation-results query; {entity} and {project} are path parameters.
String endpoint = "https://api.example.com/v2/{entity}/{project}/eval_results/query";

// JSON request body, sent verbatim.
String requestJson = "{\n  \"evaluation_call_ids\": [\n    \"<string>\"\n  ],\n  \"evaluation_run_ids\": [\n    \"<string>\"\n  ],\n  \"filter_logic_operator\": \"or\",\n  \"filters\": [\n    {\n      \"query\": {\n        \"$expr\": {\n          \"$and\": [\n            {\n              \"$literal\": \"<string>\"\n            }\n          ]\n        }\n      },\n      \"evaluation_call_id\": \"<string>\"\n    }\n  ],\n  \"include_costs\": false,\n  \"include_predict_and_score_children\": true,\n  \"include_raw_data_rows\": false,\n  \"include_rows\": true,\n  \"include_summary\": false,\n  \"limit\": 123,\n  \"offset\": 0,\n  \"require_intersection\": false,\n  \"resolve_row_refs\": false,\n  \"sort_by\": [\n    {\n      \"field\": \"<string>\",\n      \"evaluation_call_id\": \"<string>\",\n      \"mode\": \"value\"\n    }\n  ],\n  \"summary_require_intersection\": true\n}";

// POST the body as JSON and read the response as a string.
HttpResponse<String> response = Unirest.post(endpoint)
  .header("Content-Type", "application/json")
  .body(requestJson)
  .asString();

require 'uri'
require 'net/http'

# Endpoint of the evaluation-results query; {entity} and {project} are path parameters.
url = URI("https://api.example.com/v2/{entity}/{project}/eval_results/query")

# Build the POST request with its JSON body, sent verbatim.
request = Net::HTTP::Post.new(url)
request["Content-Type"] = 'application/json'
request.body = "{\n  \"evaluation_call_ids\": [\n    \"<string>\"\n  ],\n  \"evaluation_run_ids\": [\n    \"<string>\"\n  ],\n  \"filter_logic_operator\": \"or\",\n  \"filters\": [\n    {\n      \"query\": {\n        \"$expr\": {\n          \"$and\": [\n            {\n              \"$literal\": \"<string>\"\n            }\n          ]\n        }\n      },\n      \"evaluation_call_id\": \"<string>\"\n    }\n  ],\n  \"include_costs\": false,\n  \"include_predict_and_score_children\": true,\n  \"include_raw_data_rows\": false,\n  \"include_rows\": true,\n  \"include_summary\": false,\n  \"limit\": 123,\n  \"offset\": 0,\n  \"require_intersection\": false,\n  \"resolve_row_refs\": false,\n  \"sort_by\": [\n    {\n      \"field\": \"<string>\",\n      \"evaluation_call_id\": \"<string>\",\n      \"mode\": \"value\"\n    }\n  ],\n  \"summary_require_intersection\": true\n}"

# Open a TLS connection, send the request, and print the response body.
response = Net::HTTP.start(url.host, url.port, use_ssl: true) do |http|
  http.request(request)
end
puts response.read_body

{
  "rows": [
    {
      "row_digest": "<string>",
      "evaluations": [
        {
          "evaluation_call_id": "<string>",
          "trials": [
            {
              "predict_and_score_call_id": "<string>",
              "genai_span_ref": [
                {
                  "span_id": "<string>",
                  "trace_id": "<string>"
                }
              ],
              "model_latency_seconds": 123,
              "model_output": null,
              "predict_call_id": "<string>",
              "scorer_call_ids": {},
              "scores": {},
              "total_cost": 123,
              "total_tokens": 123
            }
          ]
        }
      ],
      "raw_data_row": null
    }
  ],
  "total_rows": 123,
  "summary": {
    "evaluations": [
      {
        "evaluation_call_id": "<string>",
        "display_name": "<string>",
        "evaluation_ref": "<string>",
        "model_ref": "<string>",
        "predict_total_cost": 123,
        "predict_total_tokens": 123,
        "scorer_stats": [
          {
            "scorer_key": "<string>",
            "numeric_count": 0,
            "numeric_mean": 123,
            "pass_known_count": 0,
            "pass_rate": 123,
            "pass_signal_coverage": 123,
            "pass_true_count": 0,
            "path": "<string>",
            "trial_count": 0
          }
        ],
        "started_at": "<string>",
        "trace_id": "<string>",
        "trial_count": 0
      }
    ],
    "row_count": 0
  },
  "warnings": [
    "<string>"
  ]
}

{
  "detail": [
    {
      "loc": [
        "<string>"
      ],
      "msg": "<string>",
      "type": "<string>"
    }
  ]
}

Paramètres de chemin

entity

string

requis

project

string

requis

Corps

application/json

evaluation_call_ids

string[] | null

ID des appels racine d'évaluation à inclure.

evaluation_run_ids

string[] | null

Alias des ID d'appel d'évaluation provenant de l'API Evaluation Runs.

filter_logic_operator

enum<string>

défaut:or

Manière de combiner les filtres entre les évaluations : 'and' (toutes — la ligne doit correspondre dans TOUTES les évaluations) ou 'or' (au moins une — la ligne doit correspondre dans N’IMPORTE QUELLE évaluation). Valeur par défaut : 'or' (au moins une).

Options disponibles:

and,

or

filters

EvalResultsFilter · object[] | null

Filtres appliqués aux lignes groupées. Plusieurs filtres sont combinés avec AND.

Afficher les attributs enfants

include_costs

boolean

défaut:false

Lorsque la valeur est true, le coût est ajouté aux appels enfants de prédiction et de scoring afin que la synthèse puisse indiquer predict_total_cost pour la prédiction seule. Option à activer explicitement : les appelants qui ne l'activent pas évitent le calcul du coût.

include_predict_and_score_children

boolean

défaut:true

Lorsque true (par défaut), récupère les appels enfants (predict/score) de chaque appel predict_and_score pour renseigner predict_call_id, scorer_call_ids et des données de latence/jeton plus précises. Lorsque false, ces champs sont dérivés de l’appel predict_and_score lui-même (predict_call_id et scorer_call_ids seront null/vides).

include_raw_data_rows

boolean

défaut:false

Lorsque cette valeur est true, raw_data_row est renseigné sur chaque ligne de résultat. Les lignes inline sont renvoyées sous la forme de leur valeur dict ; les lignes référencées par un jeu de données sont renvoyées sous forme de chaîne de référence, sauf si resolve_row_refs est également true.

include_rows

boolean

défaut:true

Lorsque cette valeur est true, les données groupées de ligne/essai sont incluses dans rows et total_rows est calculé pour la vue demandée au niveau ligne.

include_summary

boolean

défaut:false

Lorsque cette valeur est true, les données de synthèse agrégées du scorer et de l'évaluation sont incluses dans summary.

limit

integer | null

Taille de page facultative au niveau ligne, appliquée après le regroupement et l'intersection.

offset

integer

défaut:0

Décalage de page facultatif au niveau ligne, appliqué après le regroupement et l'intersection.

require_intersection

boolean

défaut:false

Lorsque cette valeur est true, seules les lignes présentes dans toutes les évaluations demandées sont incluses.

resolve_row_refs

boolean

défaut:false

Lorsque cette valeur est true (nécessite include_raw_data_rows=True), les chaînes de référence des lignes du jeu de données sont résolues en données de ligne réelles via une recherche dans la table. Lorsque cette valeur est false, les références de ligne du jeu de données sont renvoyées telles quelles.

sort_by

EvalResultsSortBy · object[] | null

Spécification de tri des lignes de résultat. Préfixes de champ pris en charge : « scores. », « inputs. » et « outputs. ». Lorsqu’elle est null, les lignes sont triées par row_digest ASC.

Afficher les attributs enfants

summary_require_intersection

boolean | null

Comportement d'intersection facultatif pour la section de synthèse. Lorsqu'elle vaut null, la valeur de require_intersection est utilisée.

Réponse

Réponse réussie

rows

EvalResultsRow · object[]

requis

Afficher les attributs enfants

total_rows

integer

requis

summary

EvalResultsSummaryRes · object | null

Afficher les attributs enfants

warnings

string[]

Avertissements non fatals (par ex. échec de la résolution des références de ligne du jeu de données).

Lire le jeu de données

Lister les runs d’évaluation

W&B Models

W&B Weave

Serverless Inference

Serverless Training

Requête sur les résultats d’évaluation

Paramètres de chemin

Corps

Réponse