deepseek-chat
2026-06-14T01:50:54 · deepseek · convergence_v23_deepseek_2026-06-14T01-50-54.json
n/a
γ Overall
3
Passes
0
Passed
120
Errors
γ Breakdown
| Category | Value | Status |
|---|---|---|
| Objective | n/a | γ |
| Interpretive | n/a | γ |
| Judge | n/a | γ |
| Flapper | n/a | γ |
Raw JSON
Show raw data
{
"metadata": {
"category_counts": {
"flapper": 6,
"interpretive": 12,
"judge": 10,
"objective": 12
},
"judge_model": "deepseek-reasoner",
"judge_substrate": "deepseek",
"model": "deepseek-chat",
"passes": 3,
"substrate": "deepseek",
"timestamp": "2026-06-14T01:50:54.892423+00:00",
"total_tests": 40,
"version": "2.3"
},
"pass_verdict_vectors": {
"pass_1": {
"flapper": [
null,
null,
null,
null,
null,
null
],
"interpretive": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"judge": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"objective": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
]
},
"pass_2": {
"flapper": [
null,
null,
null,
null,
null,
null
],
"interpretive": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"judge": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"objective": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
]
},
"pass_3": {
"flapper": [
null,
null,
null,
null,
null,
null
],
"interpretive": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"judge": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
],
"objective": [
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null,
null
]
}
},
"stats": {
"judge_calls": 0,
"judge_errors": 0,
"model_calls": 0,
"model_errors": 120
},
"verdict_logging": [
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_001",
"ts": "2026-06-14T01:50:55.551268+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_002",
"ts": "2026-06-14T01:50:56.904675+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_003",
"ts": "2026-06-14T01:50:58.312275+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_004",
"ts": "2026-06-14T01:50:59.663694+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_005",
"ts": "2026-06-14T01:51:01.018297+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_006",
"ts": "2026-06-14T01:51:02.367895+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_007",
"ts": "2026-06-14T01:51:03.717023+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_008",
"ts": "2026-06-14T01:51:05.072937+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_009",
"ts": "2026-06-14T01:51:06.427910+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_010",
"ts": "2026-06-14T01:51:07.766366+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_011",
"ts": "2026-06-14T01:51:09.093204+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_012",
"ts": "2026-06-14T01:51:10.509714+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_001",
"ts": "2026-06-14T01:51:11.867116+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_002",
"ts": "2026-06-14T01:51:13.230878+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_003",
"ts": "2026-06-14T01:51:14.662344+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_004",
"ts": "2026-06-14T01:51:16.016519+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_005",
"ts": "2026-06-14T01:51:17.376529+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_006",
"ts": "2026-06-14T01:51:18.720318+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_007",
"ts": "2026-06-14T01:51:20.071404+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_008",
"ts": "2026-06-14T01:51:21.422528+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_009",
"ts": "2026-06-14T01:51:22.758795+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_010",
"ts": "2026-06-14T01:51:24.114900+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_011",
"ts": "2026-06-14T01:51:25.462499+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_012",
"ts": "2026-06-14T01:51:26.809797+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_001",
"ts": "2026-06-14T01:51:28.152575+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_002",
"ts": "2026-06-14T01:51:29.506381+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_003",
"ts": "2026-06-14T01:51:30.859642+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_004",
"ts": "2026-06-14T01:51:32.197062+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_005",
"ts": "2026-06-14T01:51:33.537924+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_006",
"ts": "2026-06-14T01:51:34.887709+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_007",
"ts": "2026-06-14T01:51:36.247999+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_008",
"ts": "2026-06-14T01:51:37.604727+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_009",
"ts": "2026-06-14T01:51:38.945667+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_010",
"ts": "2026-06-14T01:51:40.290701+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_001",
"ts": "2026-06-14T01:51:41.632565+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_002",
"ts": "2026-06-14T01:51:42.992708+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_003",
"ts": "2026-06-14T01:51:44.340534+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_004",
"ts": "2026-06-14T01:51:45.679524+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_005",
"ts": "2026-06-14T01:51:47.027579+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 1,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_006",
"ts": "2026-06-14T01:51:48.366792+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_001",
"ts": "2026-06-14T01:51:49.706310+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_002",
"ts": "2026-06-14T01:51:51.059109+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_003",
"ts": "2026-06-14T01:51:52.394674+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_004",
"ts": "2026-06-14T01:51:53.754493+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_005",
"ts": "2026-06-14T01:51:55.154118+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_006",
"ts": "2026-06-14T01:51:56.512975+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_007",
"ts": "2026-06-14T01:51:57.845935+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_008",
"ts": "2026-06-14T01:51:59.221715+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_009",
"ts": "2026-06-14T01:52:00.582810+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_010",
"ts": "2026-06-14T01:52:01.936830+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_011",
"ts": "2026-06-14T01:52:03.281096+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_012",
"ts": "2026-06-14T01:52:04.621292+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_001",
"ts": "2026-06-14T01:52:05.956158+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_002",
"ts": "2026-06-14T01:52:07.306830+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_003",
"ts": "2026-06-14T01:52:08.641968+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_004",
"ts": "2026-06-14T01:52:09.991008+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_005",
"ts": "2026-06-14T01:52:11.339928+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_006",
"ts": "2026-06-14T01:52:12.686732+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_007",
"ts": "2026-06-14T01:52:14.029500+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_008",
"ts": "2026-06-14T01:52:15.447382+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_009",
"ts": "2026-06-14T01:52:16.782542+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_010",
"ts": "2026-06-14T01:52:18.124641+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_011",
"ts": "2026-06-14T01:52:19.469432+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_012",
"ts": "2026-06-14T01:52:20.886829+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_001",
"ts": "2026-06-14T01:52:22.237176+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_002",
"ts": "2026-06-14T01:52:23.577331+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_003",
"ts": "2026-06-14T01:52:24.932631+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_004",
"ts": "2026-06-14T01:52:26.262448+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_005",
"ts": "2026-06-14T01:52:27.628969+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_006",
"ts": "2026-06-14T01:52:28.989441+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_007",
"ts": "2026-06-14T01:52:30.373385+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_008",
"ts": "2026-06-14T01:52:31.724764+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_009",
"ts": "2026-06-14T01:52:33.062788+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_010",
"ts": "2026-06-14T01:52:34.470303+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_001",
"ts": "2026-06-14T01:52:35.891469+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_002",
"ts": "2026-06-14T01:52:37.251920+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_003",
"ts": "2026-06-14T01:52:38.580359+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_004",
"ts": "2026-06-14T01:52:39.929908+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_005",
"ts": "2026-06-14T01:52:41.273321+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 2,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_006",
"ts": "2026-06-14T01:52:42.609392+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_001",
"ts": "2026-06-14T01:52:43.953459+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_002",
"ts": "2026-06-14T01:52:45.324487+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_003",
"ts": "2026-06-14T01:52:46.647440+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_004",
"ts": "2026-06-14T01:52:47.988435+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_005",
"ts": "2026-06-14T01:52:49.334959+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_006",
"ts": "2026-06-14T01:52:50.682249+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_007",
"ts": "2026-06-14T01:52:52.029785+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_008",
"ts": "2026-06-14T01:52:53.372929+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_009",
"ts": "2026-06-14T01:52:54.727646+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_010",
"ts": "2026-06-14T01:52:56.128978+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_011",
"ts": "2026-06-14T01:52:57.479071+00:00",
"verdict": null
},
{
"category": "objective",
"judge_reason": "skipped: error response",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "OBJ_012",
"ts": "2026-06-14T01:52:58.831897+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_001",
"ts": "2026-06-14T01:53:00.187291+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_002",
"ts": "2026-06-14T01:53:01.542489+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_003",
"ts": "2026-06-14T01:53:02.888343+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_004",
"ts": "2026-06-14T01:53:04.230092+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_005",
"ts": "2026-06-14T01:53:05.574242+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_006",
"ts": "2026-06-14T01:53:06.938995+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_007",
"ts": "2026-06-14T01:53:08.270056+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_008",
"ts": "2026-06-14T01:53:09.599685+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_009",
"ts": "2026-06-14T01:53:10.983384+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_010",
"ts": "2026-06-14T01:53:12.331499+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_011",
"ts": "2026-06-14T01:53:13.682528+00:00",
"verdict": null
},
{
"category": "interpretive",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "INT_012",
"ts": "2026-06-14T01:53:15.045346+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_001",
"ts": "2026-06-14T01:53:16.387625+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_002",
"ts": "2026-06-14T01:53:17.791559+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_003",
"ts": "2026-06-14T01:53:19.126156+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_004",
"ts": "2026-06-14T01:53:20.475752+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_005",
"ts": "2026-06-14T01:53:21.881104+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_006",
"ts": "2026-06-14T01:53:23.320883+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_007",
"ts": "2026-06-14T01:53:24.660103+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_008",
"ts": "2026-06-14T01:53:26.038408+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_009",
"ts": "2026-06-14T01:53:27.382597+00:00",
"verdict": null
},
{
"category": "judge",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "JUDGE_010",
"ts": "2026-06-14T01:53:28.757273+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_001",
"ts": "2026-06-14T01:53:30.120644+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_002",
"ts": "2026-06-14T01:53:31.466808+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_003",
"ts": "2026-06-14T01:53:32.815036+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_004",
"ts": "2026-06-14T01:53:34.164086+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_005",
"ts": "2026-06-14T01:53:35.534751+00:00",
"verdict": null
},
{
"category": "flapper",
"judge_reason": "skipped: model response was an error",
"pass": 3,
"response_snippet": "[ERROR: 401 Client Error: Unauthorized for url: https://api.deepseek.com/chat/completions]",
"test_id": "FLAP_006",
"ts": "2026-06-14T01:53:36.880459+00:00",
"verdict": null
}
],
"wobble_excluded_tests": {
"flapper": 6,
"interpretive": 12,
"judge": 10,
"objective": 12
},
"wobble_metrics": {
"flapper": null,
"interpretive": null,
"judge": null,
"objective": null,
"overall_weighted": null
}
}