"2026-02-16T00:19:13.789621+00:00"2/16/2026, 12:19:13 AM
model
"google/gemini-2.5-flash"
app_id
182717
external_user
(null)
streamed
true
cancelled
false
latency
258
moderation_latency
(null)
generation_time
1637
tokens_prompt
2275
tokens_completion
364
native_tokens_prompt
2271
native_tokens_completion
402
native_tokens_completion_images
0
native_tokens_reasoning
0
native_tokens_cached
2038
num_media_prompt
(null)
num_input_audio_prompt
(null)
num_media_completion
0
num_search_results
(null)
origin
"https://ncbench.com/"
is_byok
false
finish_reason
"stop"
native_finish_reason
"STOP"
usage
0.00113604
router
(null)
provider_responses
0
status
200
is_byok
false
latency
258
endpoint_id
"16c01e26-9b91-4d22-b487-ed35634b017d"
provider_name
"Google AI Studio"
model_permaslug
"google/gemini-2.5-flash"
api_type
"completions"
id
"gen-1771201151-yu88DAme9BvENnWJHfbi"
upstream_id
(null)
total_cost
0.00113604
cache_discount
0.00055026
upstream_inference_cost
0
provider_name
"Google AI Studio"
Evaluation details
Result
Evaluator
Details
Meta Data
91.6667%
Accuracy (recall)
Matched: 6/6, FP: 1
parsedCount
7
matched
6
total
6
falsePositives
1
expectedDetails
0
expected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
status
"matched"
matchedBy
entry
"855"
detail
"ruler"
explanation
"The text states Avaros is Prince Belphegor's domain of greed, but the codex states Avaros is ruled by Prince Mammon and Dymas is ruled by Prince Belphegor."
paragraph
2
substring
"Prince Belphegor's domain of greed"
location
extractedText
"Prince Belphegor's domain of greed"
inBounds
true
expectedText
"Prince Belphegor's domain of greed"
locationAccurate
true
1
expected
entry
"4415"
detail
"eyeColor"
summary
"Lucien has one amber eye and one black eye (heterochromia), but the passage says both his amber eyes."
status
"matched"
matchedBy
entry
"4415"
detail
"eyeColor"
explanation
"Lucien's eyes are heterochromatic (one amber, one black), but the text implies both are amber."
paragraph
2
substring
"both his amber eyes narrowed"
location
extractedText
"both his amber eyes narrowed"
inBounds
true
expectedText
"both his amber eyes narrowed"
locationAccurate
true
2
expected
entry
"2002"
detail
"origin"
summary
"The Ledger of Debts originates from Avaros per its codex entry, but Eva says it came from Dymas."
status
"matched"
matchedBy
entry
"2002"
detail
"origin"
explanation
"The text states the Ledger of Debts came from Dymas, but the codex states its origin is Avaros."
paragraph
4
substring
"Dymas, not Avaros"
location
extractedText
"Dymas, not Avaros"
inBounds
true
expectedText
"it originally came from Dymas, not Avaros"
locationAccurate
true
3
expected
entry
"4416"
detail
"eyeColor"
summary
"Detective Quinn has brown eyes per her codex entry, but the passage says blue eyes."
status
"matched"
matchedBy
entry
"4416"
detail
"eyeColor"
explanation
"Detective Quinn's eye color is brown, not blue."
paragraph
5
substring
"her blue eyes watching"
location
extractedText
"her blue eyes watching"
inBounds
true
expectedText
"her blue eyes watching the museum"
locationAccurate
true
4
expected
entry
"4416"
detail
"hair"
summary
"Detective Quinn has salt-and-pepper hair per her codex entry, but the passage says blonde hair."
status
"matched"
matchedBy
entry
"4416"
detail
"hair"
explanation
"Detective Quinn's hair is \"closely cropped salt-and-pepper\", not short blonde."
paragraph
5
substring
"short blonde hair"
location
extractedText
"short blonde hair"
inBounds
true
expectedText
"Her short blonde hair"
locationAccurate
true
5
expected
entry
"4414"
detail
"glasses"
summary
"Eva wears round glasses per her codex entry, but the passage says square glasses."
status
"matched"
matchedBy
entry
"4414"
detail
"glasses"
explanation
"Eva's glasses are described as 'square' in the text, but the codex states 'round glasses'."
paragraph
1
substring
"square glasses"
location
extractedText
"square glasses"
inBounds
true
expectedText
"her square glasses"
locationAccurate
true
falsePositiveDetails
0
parsed
entry
"855"
detail
"sin"
explanation
"The text states Avaros is Prince Belphegor's domain of greed, but the codex states Avaros is ruled by Prince Mammon and Dymas is ruled by Prince Belphegor."
paragraph
2
substring
"Prince Belphegor's domain of greed"
status
"false_positive"
location
extractedText
"Prince Belphegor's domain of greed"
inBounds
true
expectedText
"Prince Belphegor's domain of greed"
locationAccurate
true
closestExpected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
"Eva's glasses are described as 'square' in the text, but the codex states 'round glasses'."
paragraph
1
substring
"square glasses"
status
"true_positive"
matchedExpected
entry
"4414"
detail
"glasses"
summary
"Eva wears round glasses per her codex entry, but the passage says square glasses."
location
extractedText
"square glasses"
inBounds
true
expectedText
"her square glasses"
locationAccurate
true
1
parsed
entry
"855"
detail
"sin"
explanation
"The text states Avaros is Prince Belphegor's domain of greed, but the codex states Avaros is ruled by Prince Mammon and Dymas is ruled by Prince Belphegor."
paragraph
2
substring
"Prince Belphegor's domain of greed"
status
"false_positive"
location
extractedText
"Prince Belphegor's domain of greed"
inBounds
true
expectedText
"Prince Belphegor's domain of greed"
locationAccurate
true
closestExpected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
"The text states Avaros is Prince Belphegor's domain of greed, but the codex states Avaros is ruled by Prince Mammon and Dymas is ruled by Prince Belphegor."
paragraph
2
substring
"Prince Belphegor's domain of greed"
status
"true_positive"
matchedExpected
entry
"855"
detail
"ruler"
summary
"Avaros is Prince Mammon's realm per the codex, but Eva says it is Prince Belphegor's domain."
location
extractedText
"Prince Belphegor's domain of greed"
inBounds
true
expectedText
"Prince Belphegor's domain of greed"
locationAccurate
true
3
parsed
entry
"4415"
detail
"eyeColor"
explanation
"Lucien's eyes are heterochromatic (one amber, one black), but the text implies both are amber."
paragraph
2
substring
"both his amber eyes narrowed"
status
"true_positive"
matchedExpected
entry
"4415"
detail
"eyeColor"
summary
"Lucien has one amber eye and one black eye (heterochromia), but the passage says both his amber eyes."
location
extractedText
"both his amber eyes narrowed"
inBounds
true
expectedText
"both his amber eyes narrowed"
locationAccurate
true
4
parsed
entry
"2002"
detail
"origin"
explanation
"The text states the Ledger of Debts came from Dymas, but the codex states its origin is Avaros."
paragraph
4
substring
"Dymas, not Avaros"
status
"true_positive"
matchedExpected
entry
"2002"
detail
"origin"
summary
"The Ledger of Debts originates from Avaros per its codex entry, but Eva says it came from Dymas."
location
extractedText
"Dymas, not Avaros"
inBounds
true
expectedText
"it originally came from Dymas, not Avaros"
locationAccurate
true
5
parsed
entry
"4416"
detail
"eyeColor"
explanation
"Detective Quinn's eye color is brown, not blue."
paragraph
5
substring
"her blue eyes watching"
status
"true_positive"
matchedExpected
entry
"4416"
detail
"eyeColor"
summary
"Detective Quinn has brown eyes per her codex entry, but the passage says blue eyes."
location
extractedText
"her blue eyes watching"
inBounds
true
expectedText
"her blue eyes watching the museum"
locationAccurate
true
6
parsed
entry
"4416"
detail
"hair"
explanation
"Detective Quinn's hair is \"closely cropped salt-and-pepper\", not short blonde."
paragraph
5
substring
"short blonde hair"
status
"true_positive"
matchedExpected
entry
"4416"
detail
"hair"
summary
"Detective Quinn has salt-and-pepper hair per her codex entry, but the passage says blonde hair."