"2026-02-16T11:07:31.744742+00:00"2/16/2026, 11:07:31 AM
model
"qwen/qwen3.5-plus-20260216"
app_id
182717
external_user
(null)
streamed
true
cancelled
false
latency
1019
moderation_latency
(null)
generation_time
34589
tokens_prompt
3813
tokens_completion
971
native_tokens_prompt
3907
native_tokens_completion
973
native_tokens_completion_images
(null)
native_tokens_reasoning
0
native_tokens_cached
0
num_media_prompt
(null)
num_input_audio_prompt
(null)
num_media_completion
0
num_search_results
(null)
origin
"https://ncbench.com/"
is_byok
false
finish_reason
"stop"
native_finish_reason
"stop"
usage
0.003898
router
(null)
provider_responses
0
id
"chatcmpl-be926143-c169-9d51-bc97-5fc0957438ec"
status
200
is_byok
false
latency
1019
endpoint_id
"71e0f6c3-7815-4734-92d3-8a04f3b0ca91"
provider_name
"Alibaba"
model_permaslug
"qwen/qwen3.5-plus-20260216"
api_type
"completions"
id
"gen-1771240016-eq4GYO6VD0E1amDAEfWE"
upstream_id
"chatcmpl-be926143-c169-9d51-bc97-5fc0957438ec"
total_cost
0.003898
cache_discount
(null)
upstream_inference_cost
0
provider_name
"Alibaba"
Evaluation details
Result
Evaluator
Details
Meta Data
50.0000%
Accuracy (recall)
Matched: 6/11, FP: 1
parsedCount
7
matched
6
total
11
falsePositives
1
expectedDetails
0
expected
entry
"856"
detail
"currentLocation"
summary
"The Veil Market is beneath Camden per the codex, but the passage says Shoreditch."
status
"matched"
matchedBy
entry
"856"
detail
"currentLocation"
explanation
"The text states the market is beneath Shoreditch, but the codex says it is beneath Camden."
paragraph
1
substring
"abandoned Tube station beneath Shoreditch"
location
extractedText
"abandoned Tube station beneath Shoreditch"
inBounds
true
expectedText
"the abandoned Tube station beneath Shoreditch"
locationAccurate
true
1
expected
entry
"4418"
detail
"eyeColor"
summary
"Nyx has violet eyes per the codex, but the passage says blue eyes."
status
"matched"
matchedBy
entry
"4418"
detail
"eyeColor"
explanation
"The text describes Nyx's eyes as blue, but the codex states they are faintly glowing violet."
paragraph
1
substring
"glowing blue eyes"
location
extractedText
"glowing blue eyes"
inBounds
true
expectedText
"their glowing blue eyes"
locationAccurate
true
2
expected
entry
"4417"
detail
"scar"
summary
"Tomás has a scar on his left forearm per the codex, but the passage says right forearm."
status
"matched"
matchedBy
entry
"4417"
detail
"scar"
explanation
"The text places Tomás's scar on his right forearm, but the codex specifies it is on his left forearm."
paragraph
2
substring
"scarred right forearm"
location
extractedText
"scarred right forearm"
inBounds
true
expectedText
"his scarred right forearm"
locationAccurate
true
3
expected
entry
"4417"
detail
"birthplace"
summary
"Tomás was born in Seville per the codex, but the passage implies Madrid via his accent."
status
"matched"
matchedBy
entry
"4417"
detail
"birthplace"
explanation
"The text implies Tomás is from Madrid via his accent, but the codex states his birthplace is Seville, Spain."
paragraph
2
substring
"Madrid accent"
location
extractedText
"Madrid accent"
inBounds
true
expectedText
"his Madrid accent"
locationAccurate
true
4
expected
entry
"4420"
detail
"hair"
summary
"Kai has dyed electric-blue hair per the codex, but the passage says natural black hair."
status
"matched"
matchedBy
entry
"4420"
detail
"hair"
explanation
"The text describes Kai's hair as natural black, but the codex states it is dyed electric-blue."
paragraph
3
substring
"natural black hair"
location
extractedText
"natural black hair"
inBounds
true
expectedText
"His natural black hair"
locationAccurate
true
5
expected
entry
"4419"
detail
"eyeColor"
summary
"Maggie has sharp grey eyes per the codex, but the passage says green eyes."
status
"matched"
matchedBy
entry
"4419"
detail
"eyeColor"
explanation
"The text describes Maggie's eyes as green, but the codex states they are sharp grey."
paragraph
4
substring
"keen green eyes"
location
extractedText
"keen green eyes"
inBounds
true
expectedText
"her keen green eyes"
locationAccurate
true
6
expected
entry
"6002"
detail
"headquarters"
summary
"The Crimson Court is headquartered in Dymas per the codex, but Maggie says their base is in Avaros."
status
"missed"
7
expected
entry
"2003"
detail
"material"
summary
"The Irathi War Gauntlet is blackened iron with red runes per the codex, but the passage says gleaming steel with blue runes."
status
"missed"
8
expected
entry
"2003"
detail
"origin"
summary
"The Irathi War Gauntlet is from Irath per the codex, but the merchant says it's from Dymas."
status
"missed"
9
expected
entry
"2003"
detail
"creator"
summary
"The Irathi War Gauntlet was forged by a demon smith named Gorath per the codex, but the merchant attributes it to Prince Abaddon."
status
"missed"
10
expected
entry
"2004"
detail
"faceMarkings"
summary
"The Veil Compass face is etched with sigils per the codex, but the passage says the face is smooth and unmarked."
status
"missed"
falsePositiveDetails
0
parsed
entry
"4419"
detail
"walkingStick"
explanation
"The text refers to Maggie using a cane, but the codex specifies she uses a blackthorn walking stick (while Tomás is the one associated with medical/mobility issues implicitly, Maggie's item is distinct). *Correction*: The codex explicitly lists \"walkingStick\" for Maggie, so \"cane\" is acceptable synonymy, BUT the location of the Crimson Court is the bigger issue here. Let's re-evaluate \"cane\". Codex says \"blackthorn walking stick\". Text says \"cane\". This is likely acceptable. However, the statement about the Crimson Court base is wrong."
paragraph
4
substring
"tapped her cane"
status
"false_positive"
location
extractedText
"tapped her cane"
inBounds
true
expectedText
"her keen green eyes"
locationAccurate
false
closestExpected
entry
"4419"
detail
"eyeColor"
summary
"Maggie has sharp grey eyes per the codex, but the passage says green eyes."
"The text states the market is beneath Shoreditch, but the codex says it is beneath Camden."
paragraph
1
substring
"abandoned Tube station beneath Shoreditch"
status
"true_positive"
matchedExpected
entry
"856"
detail
"currentLocation"
summary
"The Veil Market is beneath Camden per the codex, but the passage says Shoreditch."
location
extractedText
"abandoned Tube station beneath Shoreditch"
inBounds
true
expectedText
"the abandoned Tube station beneath Shoreditch"
locationAccurate
true
1
parsed
entry
"4418"
detail
"eyeColor"
explanation
"The text describes Nyx's eyes as blue, but the codex states they are faintly glowing violet."
paragraph
1
substring
"glowing blue eyes"
status
"true_positive"
matchedExpected
entry
"4418"
detail
"eyeColor"
summary
"Nyx has violet eyes per the codex, but the passage says blue eyes."
location
extractedText
"glowing blue eyes"
inBounds
true
expectedText
"their glowing blue eyes"
locationAccurate
true
2
parsed
entry
"4417"
detail
"scar"
explanation
"The text places Tomás's scar on his right forearm, but the codex specifies it is on his left forearm."
paragraph
2
substring
"scarred right forearm"
status
"true_positive"
matchedExpected
entry
"4417"
detail
"scar"
summary
"Tomás has a scar on his left forearm per the codex, but the passage says right forearm."
location
extractedText
"scarred right forearm"
inBounds
true
expectedText
"his scarred right forearm"
locationAccurate
true
3
parsed
entry
"4417"
detail
"birthplace"
explanation
"The text implies Tomás is from Madrid via his accent, but the codex states his birthplace is Seville, Spain."
paragraph
2
substring
"Madrid accent"
status
"true_positive"
matchedExpected
entry
"4417"
detail
"birthplace"
summary
"Tomás was born in Seville per the codex, but the passage implies Madrid via his accent."
location
extractedText
"Madrid accent"
inBounds
true
expectedText
"his Madrid accent"
locationAccurate
true
4
parsed
entry
"4420"
detail
"hair"
explanation
"The text describes Kai's hair as natural black, but the codex states it is dyed electric-blue."
paragraph
3
substring
"natural black hair"
status
"true_positive"
matchedExpected
entry
"4420"
detail
"hair"
summary
"Kai has dyed electric-blue hair per the codex, but the passage says natural black hair."
location
extractedText
"natural black hair"
inBounds
true
expectedText
"His natural black hair"
locationAccurate
true
5
parsed
entry
"4419"
detail
"eyeColor"
explanation
"The text describes Maggie's eyes as green, but the codex states they are sharp grey."
paragraph
4
substring
"keen green eyes"
status
"true_positive"
matchedExpected
entry
"4419"
detail
"eyeColor"
summary
"Maggie has sharp grey eyes per the codex, but the passage says green eyes."
location
extractedText
"keen green eyes"
inBounds
true
expectedText
"her keen green eyes"
locationAccurate
true
6
parsed
entry
"4419"
detail
"walkingStick"
explanation
"The text refers to Maggie using a cane, but the codex specifies she uses a blackthorn walking stick (while Tomás is the one associated with medical/mobility issues implicitly, Maggie's item is distinct). *Correction*: The codex explicitly lists \"walkingStick\" for Maggie, so \"cane\" is acceptable synonymy, BUT the location of the Crimson Court is the bigger issue here. Let's re-evaluate \"cane\". Codex says \"blackthorn walking stick\". Text says \"cane\". This is likely acceptable. However, the statement about the Crimson Court base is wrong."
paragraph
4
substring
"tapped her cane"
status
"false_positive"
location
extractedText
"tapped her cane"
inBounds
true
expectedText
"her keen green eyes"
locationAccurate
false
closestExpected
entry
"4419"
detail
"eyeColor"
summary
"Maggie has sharp grey eyes per the codex, but the passage says green eyes."