"2026-02-16T11:03:22.437871+00:00"2/16/2026, 11:03:22 AM
model
"qwen/qwen3.5-plus-20260216"
app_id
182717
external_user
(null)
streamed
true
cancelled
false
latency
860
moderation_latency
(null)
generation_time
12583
tokens_prompt
2275
tokens_completion
330
native_tokens_prompt
2321
native_tokens_completion
359
native_tokens_completion_images
(null)
native_tokens_reasoning
0
native_tokens_cached
0
num_media_prompt
(null)
num_input_audio_prompt
(null)
num_media_completion
0
num_search_results
(null)
origin
"https://ncbench.com/"
is_byok
false
finish_reason
"stop"
native_finish_reason
"stop"
usage
0.00179
router
(null)
provider_responses
0
id
"chatcmpl-d7bc90a3-22fb-9d97-ba57-4d73327ada67"
status
200
is_byok
false
latency
860
endpoint_id
"71e0f6c3-7815-4734-92d3-8a04f3b0ca91"
provider_name
"Alibaba"
model_permaslug
"qwen/qwen3.5-plus-20260216"
api_type
"completions"
id
"gen-1771239789-eHxuQeEIPfYpsc0NVJyX"
upstream_id
"chatcmpl-d7bc90a3-22fb-9d97-ba57-4d73327ada67"
total_cost
0.00179
cache_discount
(null)
upstream_inference_cost
0
provider_name
"Alibaba"
Evaluation details
Result
Evaluator
Details
Meta Data
75.0000%
Accuracy (recall)
Matched: 5/6, FP: 1
parsedCount
6
matched
5
total
6
falsePositives
1
expectedDetails
0
expected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
status
"missed"
nearMiss
parsed
entry
"853"
detail
"ruler"
explanation
"The text attributes the domain of greed (Avaros) to Prince Belphegor, but the codex states Avaros is ruled by \"Prince Mammon\" and Belphegor rules Dymas (Gluttony)."
paragraph
2
substring
"Prince Belphegor's domain of greed"
reason
"entry mismatch: got \"853\", expected \"855\""
1
expected
entry
"4415"
detail
"eyeColor"
summary
"Lucien has one amber eye and one black eye (heterochromia), but the passage says both his amber eyes."
status
"matched"
matchedBy
entry
"4415"
detail
"eyeColor"
explanation
"The text says Lucien has two amber eyes, but the codex states his eyes are \"heterochromatic — one amber, one black\"."
paragraph
2
substring
"both his amber eyes"
location
extractedText
"both his amber eyes"
inBounds
true
expectedText
"both his amber eyes narrowed"
locationAccurate
true
2
expected
entry
"2002"
detail
"origin"
summary
"The Ledger of Debts originates from Avaros per its codex entry, but Eva says it came from Dymas."
status
"matched"
matchedBy
entry
"2002"
detail
"origin"
explanation
"The text claims the Ledger originated in Dymas, but the codex states its origin is \"Avaros\"."
paragraph
4
substring
"it originally came from Dymas, not Avaros"
location
extractedText
"it originally came from Dymas, not Avaros"
inBounds
true
expectedText
"it originally came from Dymas, not Avaros"
locationAccurate
true
3
expected
entry
"4416"
detail
"eyeColor"
summary
"Detective Quinn has brown eyes per her codex entry, but the passage says blue eyes."
status
"matched"
matchedBy
entry
"4416"
detail
"eyeColor"
explanation
"The text describes Detective Quinn's eyes as blue, but the codex states her eye color is \"brown\"."
paragraph
5
substring
"her blue eyes"
location
extractedText
"her blue eyes"
inBounds
true
expectedText
"her blue eyes watching the museum"
locationAccurate
true
4
expected
entry
"4416"
detail
"hair"
summary
"Detective Quinn has salt-and-pepper hair per her codex entry, but the passage says blonde hair."
status
"matched"
matchedBy
entry
"4416"
detail
"hair"
explanation
"The text describes Detective Quinn's hair as blonde, but the codex states her hair is \"closely cropped salt-and-pepper\"."
paragraph
5
substring
"Her short blonde hair"
location
extractedText
"Her short blonde hair"
inBounds
true
expectedText
"Her short blonde hair"
locationAccurate
true
5
expected
entry
"4414"
detail
"glasses"
summary
"Eva wears round glasses per her codex entry, but the passage says square glasses."
status
"matched"
matchedBy
entry
"4414"
detail
"glasses"
explanation
"The text describes Eva's glasses as square, but the codex states she wears \"round glasses\"."
paragraph
1
substring
"square glasses"
location
extractedText
"square glasses"
inBounds
true
expectedText
"her square glasses"
locationAccurate
true
falsePositiveDetails
0
parsed
entry
"853"
detail
"ruler"
explanation
"The text attributes the domain of greed (Avaros) to Prince Belphegor, but the codex states Avaros is ruled by \"Prince Mammon\" and Belphegor rules Dymas (Gluttony)."
paragraph
2
substring
"Prince Belphegor's domain of greed"
status
"false_positive"
location
extractedText
"Prince Belphegor's domain of greed"
inBounds
true
expectedText
"Prince Belphegor's domain of greed"
locationAccurate
true
closestExpected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
reason
"entry mismatch: got \"853\", expected \"855\""
83.3333%
Precision
True positives: 5/6
totalReported
6
truePositives
5
reportedDetails
0
parsed
entry
"4414"
detail
"glasses"
explanation
"The text describes Eva's glasses as square, but the codex states she wears \"round glasses\"."
paragraph
1
substring
"square glasses"
status
"true_positive"
matchedExpected
entry
"4414"
detail
"glasses"
summary
"Eva wears round glasses per her codex entry, but the passage says square glasses."
location
extractedText
"square glasses"
inBounds
true
expectedText
"her square glasses"
locationAccurate
true
1
parsed
entry
"853"
detail
"ruler"
explanation
"The text attributes the domain of greed (Avaros) to Prince Belphegor, but the codex states Avaros is ruled by \"Prince Mammon\" and Belphegor rules Dymas (Gluttony)."
paragraph
2
substring
"Prince Belphegor's domain of greed"
status
"false_positive"
location
extractedText
"Prince Belphegor's domain of greed"
inBounds
true
expectedText
"Prince Belphegor's domain of greed"
locationAccurate
true
closestExpected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
reason
"entry mismatch: got \"853\", expected \"855\""
2
parsed
entry
"4415"
detail
"eyeColor"
explanation
"The text says Lucien has two amber eyes, but the codex states his eyes are \"heterochromatic — one amber, one black\"."
paragraph
2
substring
"both his amber eyes"
status
"true_positive"
matchedExpected
entry
"4415"
detail
"eyeColor"
summary
"Lucien has one amber eye and one black eye (heterochromia), but the passage says both his amber eyes."
location
extractedText
"both his amber eyes"
inBounds
true
expectedText
"both his amber eyes narrowed"
locationAccurate
true
3
parsed
entry
"2002"
detail
"origin"
explanation
"The text claims the Ledger originated in Dymas, but the codex states its origin is \"Avaros\"."
paragraph
4
substring
"it originally came from Dymas, not Avaros"
status
"true_positive"
matchedExpected
entry
"2002"
detail
"origin"
summary
"The Ledger of Debts originates from Avaros per its codex entry, but Eva says it came from Dymas."
location
extractedText
"it originally came from Dymas, not Avaros"
inBounds
true
expectedText
"it originally came from Dymas, not Avaros"
locationAccurate
true
4
parsed
entry
"4416"
detail
"eyeColor"
explanation
"The text describes Detective Quinn's eyes as blue, but the codex states her eye color is \"brown\"."
paragraph
5
substring
"her blue eyes"
status
"true_positive"
matchedExpected
entry
"4416"
detail
"eyeColor"
summary
"Detective Quinn has brown eyes per her codex entry, but the passage says blue eyes."
location
extractedText
"her blue eyes"
inBounds
true
expectedText
"her blue eyes watching the museum"
locationAccurate
true
5
parsed
entry
"4416"
detail
"hair"
explanation
"The text describes Detective Quinn's hair as blonde, but the codex states her hair is \"closely cropped salt-and-pepper\"."
paragraph
5
substring
"Her short blonde hair"
status
"true_positive"
matchedExpected
entry
"4416"
detail
"hair"
summary
"Detective Quinn has salt-and-pepper hair per her codex entry, but the passage says blonde hair."