@pentatonic-ai/ai-agent-sdk 0.6.0 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94) hide show
  1. package/README.md +170 -69
  2. package/bin/__tests__/callback-server.test.js +4 -1
  3. package/bin/cli.js +41 -164
  4. package/bin/commands/config.js +251 -0
  5. package/package.json +2 -1
  6. package/packages/doctor/__tests__/detect.test.js +2 -6
  7. package/packages/doctor/src/checks/local-memory.js +164 -196
  8. package/packages/doctor/src/detect.js +11 -3
  9. package/packages/memory/src/corpus/adapters.js +104 -0
  10. package/packages/memory/src/corpus/cli.js +72 -7
  11. package/packages/memory/src/corpus/index.js +1 -1
  12. package/packages/memory-engine/.env.example +13 -0
  13. package/packages/memory-engine/README.md +131 -0
  14. package/packages/memory-engine/bench/README.md +99 -0
  15. package/packages/memory-engine/bench/scorecards-engine/agent-coding__pentatonic-baseline__20260427-142523.json +1115 -0
  16. package/packages/memory-engine/bench/scorecards-engine/chat-recall__pentatonic-baseline__20260427-142648.json +819 -0
  17. package/packages/memory-engine/bench/scorecards-engine/circular-economy__pentatonic-baseline__20260427-142757.json +1278 -0
  18. package/packages/memory-engine/bench/scorecards-engine/customer-support__pentatonic-baseline__20260427-142900.json +1018 -0
  19. package/packages/memory-engine/bench/scorecards-engine/marketplace-ops__pentatonic-baseline__20260427-142957.json +1038 -0
  20. package/packages/memory-engine/bench/scorecards-engine/product-catalogue__pentatonic-baseline__20260427-143122.json +961 -0
  21. package/packages/memory-engine/bench/scorecards-engine-via-docker/agent-coding__pentatonic-memory__20260427-161812.json +1115 -0
  22. package/packages/memory-engine/bench/scorecards-engine-via-docker/chat-recall__pentatonic-memory__20260427-161701.json +819 -0
  23. package/packages/memory-engine/bench/scorecards-engine-via-docker/circular-economy__pentatonic-memory__20260427-161713.json +1278 -0
  24. package/packages/memory-engine/bench/scorecards-engine-via-docker/customer-support__pentatonic-memory__20260427-161723.json +1018 -0
  25. package/packages/memory-engine/bench/scorecards-engine-via-docker/marketplace-ops__pentatonic-memory__20260427-161732.json +1038 -0
  26. package/packages/memory-engine/bench/scorecards-engine-via-docker/product-catalogue__pentatonic-memory__20260427-161741.json +937 -0
  27. package/packages/memory-engine/bench/scorecards-engine-via-l2-7-layer-populated/agent-coding__pentatonic-memory__20260427-184718.json +1115 -0
  28. package/packages/memory-engine/bench/scorecards-engine-via-l2-7-layer-populated/chat-recall__pentatonic-memory__20260427-184614.json +819 -0
  29. package/packages/memory-engine/bench/scorecards-engine-via-l2-7-layer-populated/circular-economy__pentatonic-memory__20260427-184809.json +1278 -0
  30. package/packages/memory-engine/bench/scorecards-engine-via-l2-7-layer-populated/customer-support__pentatonic-memory__20260427-184854.json +1018 -0
  31. package/packages/memory-engine/bench/scorecards-engine-via-l2-7-layer-populated/marketplace-ops__pentatonic-memory__20260427-184929.json +1038 -0
  32. package/packages/memory-engine/bench/scorecards-engine-via-l2-7-layer-populated/product-catalogue__pentatonic-memory__20260427-185015.json +961 -0
  33. package/packages/memory-engine/bench/scorecards-engine-via-l2-empty-layers/agent-coding__pentatonic-memory__20260427-175252.json +1115 -0
  34. package/packages/memory-engine/bench/scorecards-engine-via-l2-empty-layers/chat-recall__pentatonic-memory__20260427-175312.json +819 -0
  35. package/packages/memory-engine/bench/scorecards-engine-via-l2-empty-layers/circular-economy__pentatonic-memory__20260427-175335.json +1278 -0
  36. package/packages/memory-engine/bench/scorecards-engine-via-l2-empty-layers/customer-support__pentatonic-memory__20260427-175355.json +1018 -0
  37. package/packages/memory-engine/bench/scorecards-engine-via-l2-empty-layers/marketplace-ops__pentatonic-memory__20260427-175413.json +1038 -0
  38. package/packages/memory-engine/bench/scorecards-engine-via-l2-empty-layers/product-catalogue__pentatonic-memory__20260427-175430.json +883 -0
  39. package/packages/memory-engine/bench/scorecards-engine-via-shim/agent-coding__pentatonic-memory__20260427-155409.json +1115 -0
  40. package/packages/memory-engine/bench/scorecards-engine-via-shim/chat-recall__pentatonic-memory__20260427-155421.json +819 -0
  41. package/packages/memory-engine/bench/scorecards-engine-via-shim/circular-economy__pentatonic-memory__20260427-155433.json +1278 -0
  42. package/packages/memory-engine/bench/scorecards-engine-via-shim/customer-support__pentatonic-memory__20260427-155443.json +1018 -0
  43. package/packages/memory-engine/bench/scorecards-engine-via-shim/marketplace-ops__pentatonic-memory__20260427-155453.json +1038 -0
  44. package/packages/memory-engine/bench/scorecards-engine-via-shim/product-catalogue__pentatonic-memory__20260427-155503.json +937 -0
  45. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/agent-coding__pentatonic-memory-latest__20260427-145103.json +1115 -0
  46. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/agent-coding__pentatonic-memory__20260427-144909.json +1115 -0
  47. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/chat-recall__pentatonic-memory-latest__20260427-145153.json +819 -0
  48. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/chat-recall__pentatonic-memory__20260427-145120.json +542 -0
  49. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/circular-economy__pentatonic-memory-latest__20260427-145313.json +1278 -0
  50. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/circular-economy__pentatonic-memory__20260427-145207.json +894 -0
  51. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/customer-support__pentatonic-memory-latest__20260427-145412.json +1018 -0
  52. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/customer-support__pentatonic-memory__20260427-145327.json +680 -0
  53. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/marketplace-ops__pentatonic-memory-latest__20260427-145517.json +1038 -0
  54. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/marketplace-ops__pentatonic-memory__20260427-145422.json +693 -0
  55. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/product-catalogue__pentatonic-memory-latest__20260427-145616.json +961 -0
  56. package/packages/memory-engine/bench/scorecards-pentatonic-baseline/product-catalogue__pentatonic-memory__20260427-145528.json +727 -0
  57. package/packages/memory-engine/compat/Dockerfile +11 -0
  58. package/packages/memory-engine/compat/server.py +680 -0
  59. package/packages/memory-engine/docker-compose.yml +243 -0
  60. package/packages/memory-engine/docs/MIGRATION.md +178 -0
  61. package/packages/memory-engine/docs/RUNBOOK-AWS.md +375 -0
  62. package/packages/memory-engine/docs/why-v05-underperforms.md +138 -0
  63. package/packages/memory-engine/engine/README.md +52 -0
  64. package/packages/memory-engine/engine/l2-hybridrag-proxy.py +1543 -0
  65. package/packages/memory-engine/engine/l5-comms-layer.py +663 -0
  66. package/packages/memory-engine/engine/l6-document-store.py +1018 -0
  67. package/packages/memory-engine/engine/services/l2/Dockerfile +41 -0
  68. package/packages/memory-engine/engine/services/l2/init_databases.py +81 -0
  69. package/packages/memory-engine/engine/services/l2/l2-hybridrag-proxy.py +1543 -0
  70. package/packages/memory-engine/engine/services/l4/Dockerfile +15 -0
  71. package/packages/memory-engine/engine/services/l4/server.py +235 -0
  72. package/packages/memory-engine/engine/services/l5/Dockerfile +9 -0
  73. package/packages/memory-engine/engine/services/l5/l5-comms-layer.py +678 -0
  74. package/packages/memory-engine/engine/services/l6/Dockerfile +11 -0
  75. package/packages/memory-engine/engine/services/l6/l6-document-store.py +1016 -0
  76. package/packages/memory-engine/engine/services/nv-embed/Dockerfile +28 -0
  77. package/packages/memory-engine/engine/services/nv-embed/server.py +152 -0
  78. package/packages/memory-engine/pme_memory/__init__.py +0 -0
  79. package/packages/memory-engine/pme_memory/__main__.py +129 -0
  80. package/packages/memory-engine/pme_memory/artifacts.py +95 -0
  81. package/packages/memory-engine/pme_memory/embed.py +74 -0
  82. package/packages/memory-engine/pme_memory/health.py +36 -0
  83. package/packages/memory-engine/pme_memory/hygiene.py +159 -0
  84. package/packages/memory-engine/pme_memory/indexer.py +200 -0
  85. package/packages/memory-engine/pme_memory/needs.py +55 -0
  86. package/packages/memory-engine/pme_memory/provenance.py +80 -0
  87. package/packages/memory-engine/pme_memory/scoring.py +168 -0
  88. package/packages/memory-engine/pme_memory/search.py +52 -0
  89. package/packages/memory-engine/pme_memory/store.py +86 -0
  90. package/packages/memory-engine/pme_memory/synthesis.py +114 -0
  91. package/packages/memory-engine/pyproject.toml +65 -0
  92. package/packages/memory-engine/scripts/kg-extractor.py +557 -0
  93. package/packages/memory-engine/scripts/kg-preflexor-v2.py +738 -0
  94. package/packages/memory-engine/tests/test_api_contract.sh +57 -0
@@ -0,0 +1,883 @@
1
+ {
2
+ "bench": "product-catalogue",
3
+ "stack": "pentatonic-memory",
4
+ "n_tasks": 18,
5
+ "n_correct": 13,
6
+ "accuracy": 0.7222222222222222,
7
+ "mean_score": 0.7777777777777778,
8
+ "p50_search_ms": 479.20782800065354,
9
+ "p95_search_ms": 560.5700919986703,
10
+ "total_tokens_in": 0,
11
+ "total_tokens_out": 0,
12
+ "total_usd": 0.0,
13
+ "by_tag": {
14
+ "factoid": {
15
+ "n": 10,
16
+ "mean_score": 0.95,
17
+ "accuracy": 0.9
18
+ },
19
+ "material": {
20
+ "n": 4,
21
+ "mean_score": 0.625,
22
+ "accuracy": 0.5
23
+ },
24
+ "spec": {
25
+ "n": 1,
26
+ "mean_score": 1.0,
27
+ "accuracy": 1.0
28
+ },
29
+ "warranty": {
30
+ "n": 1,
31
+ "mean_score": 1.0,
32
+ "accuracy": 1.0
33
+ },
34
+ "inventory": {
35
+ "n": 3,
36
+ "mean_score": 1.0,
37
+ "accuracy": 1.0
38
+ },
39
+ "compat": {
40
+ "n": 2,
41
+ "mean_score": 1.0,
42
+ "accuracy": 1.0
43
+ },
44
+ "multi-doc": {
45
+ "n": 3,
46
+ "mean_score": 0.6666666666666666,
47
+ "accuracy": 0.6666666666666666
48
+ },
49
+ "care": {
50
+ "n": 1,
51
+ "mean_score": 0.5,
52
+ "accuracy": 0.0
53
+ },
54
+ "policy": {
55
+ "n": 2,
56
+ "mean_score": 0.5,
57
+ "accuracy": 0.5
58
+ },
59
+ "pricing": {
60
+ "n": 2,
61
+ "mean_score": 1.0,
62
+ "accuracy": 1.0
63
+ },
64
+ "multi-hop": {
65
+ "n": 2,
66
+ "mean_score": 0.5,
67
+ "accuracy": 0.5
68
+ },
69
+ "math": {
70
+ "n": 1,
71
+ "mean_score": 0.0,
72
+ "accuracy": 0.0
73
+ },
74
+ "rubric": {
75
+ "n": 3,
76
+ "mean_score": 0.5,
77
+ "accuracy": 0.3333333333333333
78
+ },
79
+ "recommendation": {
80
+ "n": 1,
81
+ "mean_score": 0.0,
82
+ "accuracy": 0.0
83
+ },
84
+ "certification": {
85
+ "n": 1,
86
+ "mean_score": 1.0,
87
+ "accuracy": 1.0
88
+ },
89
+ "entity": {
90
+ "n": 1,
91
+ "mean_score": 0.0,
92
+ "accuracy": 0.0
93
+ }
94
+ },
95
+ "extra": {
96
+ "ingest_ms": 6794.70948598464,
97
+ "grading": "substring",
98
+ "limit": 3,
99
+ "tokens": {
100
+ "corpus_tokens": 1845,
101
+ "query_tokens": 271,
102
+ "context_tokens": 4995,
103
+ "retrieval_tokens": 5266,
104
+ "naive_tokens": 33481,
105
+ "saved_tokens": 28215,
106
+ "reduction_pct": 0.8427167647322362,
107
+ "mean_retrieval_tokens_per_task": 292.55555555555554,
108
+ "tokenizer": "cl100k_base",
109
+ "per_task": {
110
+ "sku-atlas-material": {
111
+ "query": 11,
112
+ "context": 137,
113
+ "retrieval": 148,
114
+ "judge_in": 0,
115
+ "judge_out": 0,
116
+ "judge_latency_ms": 0.0
117
+ },
118
+ "sku-luna-capacity": {
119
+ "query": 8,
120
+ "context": 144,
121
+ "retrieval": 152,
122
+ "judge_in": 0,
123
+ "judge_out": 0,
124
+ "judge_latency_ms": 0.0
125
+ },
126
+ "sku-luna-warranty": {
127
+ "query": 9,
128
+ "context": 144,
129
+ "retrieval": 153,
130
+ "judge_in": 0,
131
+ "judge_out": 0,
132
+ "judge_latency_ms": 0.0
133
+ },
134
+ "sku-kite-harness-out-of-stock": {
135
+ "query": 17,
136
+ "context": 340,
137
+ "retrieval": 357,
138
+ "judge_in": 0,
139
+ "judge_out": 0,
140
+ "judge_latency_ms": 0.0
141
+ },
142
+ "sku-kite-harness-restock": {
143
+ "query": 17,
144
+ "context": 340,
145
+ "retrieval": 357,
146
+ "judge_in": 0,
147
+ "judge_out": 0,
148
+ "judge_latency_ms": 0.0
149
+ },
150
+ "sku-tee-discontinued-sizes": {
151
+ "query": 13,
152
+ "context": 359,
153
+ "retrieval": 372,
154
+ "judge_in": 0,
155
+ "judge_out": 0,
156
+ "judge_latency_ms": 0.0
157
+ },
158
+ "sku-sleeve-compat-14-mbp": {
159
+ "query": 16,
160
+ "context": 332,
161
+ "retrieval": 348,
162
+ "judge_in": 0,
163
+ "judge_out": 0,
164
+ "judge_latency_ms": 0.0
165
+ },
166
+ "sku-coffee-cup-microwave": {
167
+ "query": 8,
168
+ "context": 291,
169
+ "retrieval": 299,
170
+ "judge_in": 0,
171
+ "judge_out": 0,
172
+ "judge_latency_ms": 0.0
173
+ },
174
+ "sku-bin-liners-home-compost": {
175
+ "query": 11,
176
+ "context": 283,
177
+ "retrieval": 294,
178
+ "judge_in": 0,
179
+ "judge_out": 0,
180
+ "judge_latency_ms": 0.0
181
+ },
182
+ "policy-custom-tote-return": {
183
+ "query": 10,
184
+ "context": 218,
185
+ "retrieval": 228,
186
+ "judge_in": 0,
187
+ "judge_out": 0,
188
+ "judge_latency_ms": 0.0
189
+ },
190
+ "price-tee-subscription": {
191
+ "query": 14,
192
+ "context": 223,
193
+ "retrieval": 237,
194
+ "judge_in": 0,
195
+ "judge_out": 0,
196
+ "judge_latency_ms": 0.0
197
+ },
198
+ "price-sleeve-diff": {
199
+ "query": 19,
200
+ "context": 332,
201
+ "retrieval": 351,
202
+ "judge_in": 0,
203
+ "judge_out": 0,
204
+ "judge_latency_ms": 0.0
205
+ },
206
+ "multi-hop-kite-duotone": {
207
+ "query": 25,
208
+ "context": 340,
209
+ "retrieval": 365,
210
+ "judge_in": 0,
211
+ "judge_out": 0,
212
+ "judge_latency_ms": 0.0
213
+ },
214
+ "multi-hop-takeback-credit": {
215
+ "query": 23,
216
+ "context": 300,
217
+ "retrieval": 323,
218
+ "judge_in": 0,
219
+ "judge_out": 0,
220
+ "judge_latency_ms": 0.0
221
+ },
222
+ "rubric-recommend-kitesurf-bag": {
223
+ "query": 31,
224
+ "context": 382,
225
+ "retrieval": 413,
226
+ "judge_in": 724,
227
+ "judge_out": 51,
228
+ "judge_latency_ms": 1100.580383002758
229
+ },
230
+ "rubric-plastic-free-tee": {
231
+ "query": 11,
232
+ "context": 393,
233
+ "retrieval": 404,
234
+ "judge_in": 701,
235
+ "judge_out": 50,
236
+ "judge_latency_ms": 1114.83097499609
237
+ },
238
+ "rubric-cc-certified-items": {
239
+ "query": 14,
240
+ "context": 300,
241
+ "retrieval": 314,
242
+ "judge_in": 589,
243
+ "judge_out": 29,
244
+ "judge_latency_ms": 567.9309439957142
245
+ },
246
+ "entity-recycled-content-high": {
247
+ "query": 14,
248
+ "context": 137,
249
+ "retrieval": 151,
250
+ "judge_in": 0,
251
+ "judge_out": 0,
252
+ "judge_latency_ms": 0.0
253
+ }
254
+ },
255
+ "judge_tokens_in": 2014,
256
+ "judge_tokens_out": 130,
257
+ "judge_calls": 3,
258
+ "judge_mean_latency_ms": 927.7807673315207
259
+ },
260
+ "cost_usd": {
261
+ "assumed_completion_tokens_per_task": 100,
262
+ "rates": {
263
+ "input_per_1k": 0.0025,
264
+ "output_per_1k": 0.01,
265
+ "model": "gpt-4o"
266
+ },
267
+ "retrieval_usd_in": 0.013165000000000001,
268
+ "retrieval_usd_out": 0.018,
269
+ "retrieval_usd_total": 0.031164999999999998,
270
+ "naive_usd_total": 0.1017025,
271
+ "saved_usd": 0.0705375,
272
+ "saved_usd_per_1k_tasks": 3.91875
273
+ }
274
+ },
275
+ "task_results": [
276
+ {
277
+ "task_id": "sku-atlas-material",
278
+ "query": "What's the material composition of the Atlas Phone Shell?",
279
+ "answer": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at UK fulfilment (Worthing DC)\n**Take-back:** Yes \u2014 returnable for 50% credit after 18 months\n**Certific",
280
+ "hits": [
281
+ {
282
+ "text": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at U",
283
+ "score": 0.4098,
284
+ "source": "pentatonic-memory",
285
+ "doc_id": "sku-atlas-phone-01"
286
+ }
287
+ ],
288
+ "correct": true,
289
+ "score": 1.0,
290
+ "grading_notes": "all substrings matched",
291
+ "search_time_ms": 486.80407798383385,
292
+ "generation_time_ms": 0.0,
293
+ "tokens_in": 0,
294
+ "tokens_out": 0,
295
+ "retrieval_tokens": 148,
296
+ "query_tokens": 11,
297
+ "context_tokens": 137,
298
+ "judge_tokens_in": 0,
299
+ "judge_tokens_out": 0,
300
+ "judge_latency_ms": 0.0
301
+ },
302
+ {
303
+ "task_id": "sku-luna-capacity",
304
+ "query": "What capacity is the Luna water bottle?",
305
+ "answer": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta\n**Replacement parts:** Lid (\u00a33.50), Silicone seal (\u00a30.90)\n**Warranty:** Lifetime on body, 2 years o",
306
+ "hits": [
307
+ {
308
+ "text": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta",
309
+ "score": 0.4098,
310
+ "source": "pentatonic-memory",
311
+ "doc_id": "sku-luna-bottle-42"
312
+ }
313
+ ],
314
+ "correct": true,
315
+ "score": 1.0,
316
+ "grading_notes": "all substrings matched",
317
+ "search_time_ms": 469.72510500927456,
318
+ "generation_time_ms": 0.0,
319
+ "tokens_in": 0,
320
+ "tokens_out": 0,
321
+ "retrieval_tokens": 152,
322
+ "query_tokens": 8,
323
+ "context_tokens": 144,
324
+ "judge_tokens_in": 0,
325
+ "judge_tokens_out": 0,
326
+ "judge_latency_ms": 0.0
327
+ },
328
+ {
329
+ "task_id": "sku-luna-warranty",
330
+ "query": "What's the warranty on the Luna bottle?",
331
+ "answer": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta\n**Replacement parts:** Lid (\u00a33.50), Silicone seal (\u00a30.90)\n**Warranty:** Lifetime on body, 2 years o",
332
+ "hits": [
333
+ {
334
+ "text": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta",
335
+ "score": 0.4032,
336
+ "source": "pentatonic-memory",
337
+ "doc_id": "sku-luna-bottle-42"
338
+ }
339
+ ],
340
+ "correct": true,
341
+ "score": 1.0,
342
+ "grading_notes": "all substrings matched",
343
+ "search_time_ms": 454.7847980284132,
344
+ "generation_time_ms": 0.0,
345
+ "tokens_in": 0,
346
+ "tokens_out": 0,
347
+ "retrieval_tokens": 153,
348
+ "query_tokens": 9,
349
+ "context_tokens": 144,
350
+ "judge_tokens_in": 0,
351
+ "judge_tokens_out": 0,
352
+ "judge_latency_ms": 0.0
353
+ },
354
+ {
355
+ "task_id": "sku-kite-harness-out-of-stock",
356
+ "query": "Which size of the Nomad Kite Harness v3 is currently out of stock?",
357
+ "answer": "# Nomad Kite Harness v3 \u2014 SKU NMD-HRN-V3\n\n**Brand:** Nomad Sports\n**Category:** Watersports / Kite surfing\n**Size range:** XS (26-28\"), S (28-30\"), M (30-32\"), L (32-34\"), XL (34-36\")\n\n**Material composition:**\n- Outer shell: 92% recycled nylon 6,6 (ghost-net source)\n- Foam padding: EVA (non-recycled)\n- Hardware: 316 stainless steel spreader bar\n\n**Price:** \u00a3145.00 GBP\n**Inventory:** M=out of stock, L=6 units, XL=12 units, XS/S=restock 2026-05-15\n**Repair service:** \u00a325 flat fee, turnaround 14 d\n---\n# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n---\n# Compatibility note\n\nThe Nomad Kite Harness v3 (NMD-HRN-V3) ships with a standard spreader bar compatible with F-One and North bar systems. For Duotone or Core bar systems, the Duotone/Core adapter kit (NMD-ADPT-DC, \u00a3 18) is required.",
358
+ "hits": [
359
+ {
360
+ "text": "# Nomad Kite Harness v3 \u2014 SKU NMD-HRN-V3\n\n**Brand:** Nomad Sports\n**Category:** Watersports / Kite surfing\n**Size range:** XS (26-28\"), S (28-30\"), M (30-32\"), L (32-34\"), XL (34-36\")\n\n**Material composition:**\n- Outer shell: 92% recycled nylon 6,6 (ghost-net source)\n- Foam padding: EVA (non-recycled)\n- Hardware: 316 stainless steel spreader bar\n\n**Price:** \u00a3145.00 GBP\n**Inventory:** M=out of stoc",
361
+ "score": 0.4098,
362
+ "source": "pentatonic-memory",
363
+ "doc_id": "sku-kite-harness-v3"
364
+ },
365
+ {
366
+ "text": "# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n",
367
+ "score": 0.4032,
368
+ "source": "pentatonic-memory",
369
+ "doc_id": "inventory-update-2026-04-15"
370
+ },
371
+ {
372
+ "text": "# Compatibility note\n\nThe Nomad Kite Harness v3 (NMD-HRN-V3) ships with a standard spreader bar compatible with F-One and North bar systems. For Duotone or Core bar systems, the Duotone/Core adapter kit (NMD-ADPT-DC, \u00a3 18) is required.\n",
373
+ "score": 0.3968,
374
+ "source": "pentatonic-memory",
375
+ "doc_id": "compat-kite-harness-bar"
376
+ }
377
+ ],
378
+ "correct": true,
379
+ "score": 1.0,
380
+ "grading_notes": "all substrings matched",
381
+ "search_time_ms": 492.5855280016549,
382
+ "generation_time_ms": 0.0,
383
+ "tokens_in": 0,
384
+ "tokens_out": 0,
385
+ "retrieval_tokens": 357,
386
+ "query_tokens": 17,
387
+ "context_tokens": 340,
388
+ "judge_tokens_in": 0,
389
+ "judge_tokens_out": 0,
390
+ "judge_latency_ms": 0.0
391
+ },
392
+ {
393
+ "task_id": "sku-kite-harness-restock",
394
+ "query": "When does the Nomad Kite Harness v3 restock for XS and S?",
395
+ "answer": "# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n---\n# Nomad Kite Harness v3 \u2014 SKU NMD-HRN-V3\n\n**Brand:** Nomad Sports\n**Category:** Watersports / Kite surfing\n**Size range:** XS (26-28\"), S (28-30\"), M (30-32\"), L (32-34\"), XL (34-36\")\n\n**Material composition:**\n- Outer shell: 92% recycled nylon 6,6 (ghost-net source)\n- Foam padding: EVA (non-recycled)\n- Hardware: 316 stainless steel spreader bar\n\n**Price:** \u00a3145.00 GBP\n**Inventory:** M=out of stock, L=6 units, XL=12 units, XS/S=restock 2026-05-15\n**Repair service:** \u00a325 flat fee, turnaround 14 d\n---\n# Compatibility note\n\nThe Nomad Kite Harness v3 (NMD-HRN-V3) ships with a standard spreader bar compatible with F-One and North bar systems. For Duotone or Core bar systems, the Duotone/Core adapter kit (NMD-ADPT-DC, \u00a3 18) is required.",
396
+ "hits": [
397
+ {
398
+ "text": "# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n",
399
+ "score": 0.4098,
400
+ "source": "pentatonic-memory",
401
+ "doc_id": "inventory-update-2026-04-15"
402
+ },
403
+ {
404
+ "text": "# Nomad Kite Harness v3 \u2014 SKU NMD-HRN-V3\n\n**Brand:** Nomad Sports\n**Category:** Watersports / Kite surfing\n**Size range:** XS (26-28\"), S (28-30\"), M (30-32\"), L (32-34\"), XL (34-36\")\n\n**Material composition:**\n- Outer shell: 92% recycled nylon 6,6 (ghost-net source)\n- Foam padding: EVA (non-recycled)\n- Hardware: 316 stainless steel spreader bar\n\n**Price:** \u00a3145.00 GBP\n**Inventory:** M=out of stoc",
405
+ "score": 0.4032,
406
+ "source": "pentatonic-memory",
407
+ "doc_id": "sku-kite-harness-v3"
408
+ },
409
+ {
410
+ "text": "# Compatibility note\n\nThe Nomad Kite Harness v3 (NMD-HRN-V3) ships with a standard spreader bar compatible with F-One and North bar systems. For Duotone or Core bar systems, the Duotone/Core adapter kit (NMD-ADPT-DC, \u00a3 18) is required.\n",
411
+ "score": 0.3968,
412
+ "source": "pentatonic-memory",
413
+ "doc_id": "compat-kite-harness-bar"
414
+ }
415
+ ],
416
+ "correct": true,
417
+ "score": 1.0,
418
+ "grading_notes": "all substrings matched",
419
+ "search_time_ms": 474.821656011045,
420
+ "generation_time_ms": 0.0,
421
+ "tokens_in": 0,
422
+ "tokens_out": 0,
423
+ "retrieval_tokens": 357,
424
+ "query_tokens": 17,
425
+ "context_tokens": 340,
426
+ "judge_tokens_in": 0,
427
+ "judge_tokens_out": 0,
428
+ "judge_latency_ms": 0.0
429
+ },
430
+ {
431
+ "task_id": "sku-tee-discontinued-sizes",
432
+ "query": "Which sizes of the Pentatonic Crew Tee Black are discontinued?",
433
+ "answer": "# Pentatonic Crew Tee Black \u2014 SKU PTT-TEE-BLK\n\n**Brand:** Pentatonic\n**Category:** Apparel / T-shirts\n**Fit:** Unisex regular\n**Size range:** XS, S, M, L, XL, XXL\n\n**Material composition:**\n- 100% GOTS-certified organic cotton, 180 gsm\n- Dyeing: low-impact reactive dye, closed-loop water system\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=48, M=136, L=94, XL=22, XS=0 (discontinued), XXL=0 (discontinued)\n**Country of origin:** Portugal (CITEVE-certified mill)\n**Care:** Wash cold, line dry; no tumble d\n---\n# Pentatonic Crew Tee Sage \u2014 SKU PTT-TEE-SGE\n\nAs PTT-TEE-BLK but in sage green. Same material composition, same mill.\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=12, M=38, L=44, XL=8, XS=0, XXL=0\n**Colour note:** Sage is a seasonal SS26 colourway \u2014 not restocked after sell-through.\n---\n# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.",
434
+ "hits": [
435
+ {
436
+ "text": "# Pentatonic Crew Tee Black \u2014 SKU PTT-TEE-BLK\n\n**Brand:** Pentatonic\n**Category:** Apparel / T-shirts\n**Fit:** Unisex regular\n**Size range:** XS, S, M, L, XL, XXL\n\n**Material composition:**\n- 100% GOTS-certified organic cotton, 180 gsm\n- Dyeing: low-impact reactive dye, closed-loop water system\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=48, M=136, L=94, XL=22, XS=0 (discontinued), XXL=0 (discontinued",
437
+ "score": 0.4098,
438
+ "source": "pentatonic-memory",
439
+ "doc_id": "sku-cotton-tee-black"
440
+ },
441
+ {
442
+ "text": "# Pentatonic Crew Tee Sage \u2014 SKU PTT-TEE-SGE\n\nAs PTT-TEE-BLK but in sage green. Same material composition, same mill.\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=12, M=38, L=44, XL=8, XS=0, XXL=0\n**Colour note:** Sage is a seasonal SS26 colourway \u2014 not restocked after sell-through.\n",
443
+ "score": 0.4032,
444
+ "source": "pentatonic-memory",
445
+ "doc_id": "sku-cotton-tee-sage"
446
+ },
447
+ {
448
+ "text": "# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n",
449
+ "score": 0.3968,
450
+ "source": "pentatonic-memory",
451
+ "doc_id": "inventory-update-2026-04-15"
452
+ }
453
+ ],
454
+ "correct": true,
455
+ "score": 1.0,
456
+ "grading_notes": "all substrings matched",
457
+ "search_time_ms": 483.5939999902621,
458
+ "generation_time_ms": 0.0,
459
+ "tokens_in": 0,
460
+ "tokens_out": 0,
461
+ "retrieval_tokens": 372,
462
+ "query_tokens": 13,
463
+ "context_tokens": 359,
464
+ "judge_tokens_in": 0,
465
+ "judge_tokens_out": 0,
466
+ "judge_latency_ms": 0.0
467
+ },
468
+ {
469
+ "task_id": "sku-sleeve-compat-14-mbp",
470
+ "query": "Does the Haven Laptop Sleeve 13\" fit a 14\" MacBook Pro?",
471
+ "answer": "# Compatibility note\n\nThe Haven Laptop Sleeve 13\" (HVN-SLV-13) does NOT fit the 14\" MacBook Pro \u2014 third-party dimensions exceed 31.5cm. Use the 15\" variant (HVN-SLV-15).\n---\n# Haven Laptop Sleeve 15\" \u2014 SKU HVN-SLV-15\n\nAs HVN-SLV-13 but for 15\"-16\" laptops. Same materials, same construction.\n\n**Fits:** 15\" MacBook Air, 16\" MacBook Pro, 15.6\" Dell XPS, 15\" ThinkPad\n**Price:** \u00a358.00 GBP (\u00a310 more than 13\" variant)\n**Inventory:** 89 units UK, 54 units EU\n**Colours available:** Charcoal only (Oat and Ochre sold through)\n---\n# Haven Laptop Sleeve 13\" \u2014 SKU HVN-SLV-13\n\n**Brand:** Haven\n**Category:** Bags / Laptop protection\n**Fits:** 13\" MacBook Air M2/M3, 13.6\" MacBook Air, 13\" Dell XPS, 13\" ThinkPad\n\n**Material composition:**\n- Outer: 100% recycled PET felt (from 12 plastic bottles per unit)\n- Inner lining: 100% post-consumer recycled polyester\n- YKK recycled-polyester zip\n\n**Price:** \u00a348.00 GBP\n**Inventory:** 238 units UK, 156 units EU\n**Colours available:** Charcoal, Oat, Ochre\n**Laptop diagonal max:** 13.6\" (thi",
472
+ "hits": [
473
+ {
474
+ "text": "# Compatibility note\n\nThe Haven Laptop Sleeve 13\" (HVN-SLV-13) does NOT fit the 14\" MacBook Pro \u2014 third-party dimensions exceed 31.5cm. Use the 15\" variant (HVN-SLV-15).\n",
475
+ "score": 0.4098,
476
+ "source": "pentatonic-memory",
477
+ "doc_id": "compat-laptop-sleeve-macbook-pro-14"
478
+ },
479
+ {
480
+ "text": "# Haven Laptop Sleeve 15\" \u2014 SKU HVN-SLV-15\n\nAs HVN-SLV-13 but for 15\"-16\" laptops. Same materials, same construction.\n\n**Fits:** 15\" MacBook Air, 16\" MacBook Pro, 15.6\" Dell XPS, 15\" ThinkPad\n**Price:** \u00a358.00 GBP (\u00a310 more than 13\" variant)\n**Inventory:** 89 units UK, 54 units EU\n**Colours available:** Charcoal only (Oat and Ochre sold through)\n",
481
+ "score": 0.4032,
482
+ "source": "pentatonic-memory",
483
+ "doc_id": "sku-laptop-sleeve-15"
484
+ },
485
+ {
486
+ "text": "# Haven Laptop Sleeve 13\" \u2014 SKU HVN-SLV-13\n\n**Brand:** Haven\n**Category:** Bags / Laptop protection\n**Fits:** 13\" MacBook Air M2/M3, 13.6\" MacBook Air, 13\" Dell XPS, 13\" ThinkPad\n\n**Material composition:**\n- Outer: 100% recycled PET felt (from 12 plastic bottles per unit)\n- Inner lining: 100% post-consumer recycled polyester\n- YKK recycled-polyester zip\n\n**Price:** \u00a348.00 GBP\n**Inventory:** 238 un",
487
+ "score": 0.3968,
488
+ "source": "pentatonic-memory",
489
+ "doc_id": "sku-laptop-sleeve-13"
490
+ }
491
+ ],
492
+ "correct": true,
493
+ "score": 1.0,
494
+ "grading_notes": "all substrings matched",
495
+ "search_time_ms": 493.95382299553603,
496
+ "generation_time_ms": 0.0,
497
+ "tokens_in": 0,
498
+ "tokens_out": 0,
499
+ "retrieval_tokens": 348,
500
+ "query_tokens": 16,
501
+ "context_tokens": 332,
502
+ "judge_tokens_in": 0,
503
+ "judge_tokens_out": 0,
504
+ "judge_latency_ms": 0.0
505
+ },
506
+ {
507
+ "task_id": "sku-coffee-cup-microwave",
508
+ "query": "Can I microwave the Loop coffee cup?",
509
+ "answer": "# Loop Reusable Coffee Cup 8oz \u2014 SKU LP-CUP-008\n\n**Brand:** Loop\n**Category:** Drinkware / Coffee\n**Capacity:** 8oz (240ml)\n\n**Material composition:**\n- Body: 100% plant-based PLA (corn-derived)\n- Silicone sleeve: food-grade silicone (not bio-based)\n- Lid: BPA-free polypropylene (recycled post-industrial)\n\n**Price:** \u00a312.50 GBP\n**Inventory:** 2,104 units UK, 1,876 units EU\n**Dishwasher safe:** Top rack only\n**Lifespan:** ~2 years regular use, then return for closed-loop composting\n**Note:** Not\n---\n# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta\n**Replacement parts:** Lid (\u00a33.50), Silicone seal (\u00a30.90)\n**Warranty:** Lifetime on body, 2 years o",
510
+ "hits": [
511
+ {
512
+ "text": "# Loop Reusable Coffee Cup 8oz \u2014 SKU LP-CUP-008\n\n**Brand:** Loop\n**Category:** Drinkware / Coffee\n**Capacity:** 8oz (240ml)\n\n**Material composition:**\n- Body: 100% plant-based PLA (corn-derived)\n- Silicone sleeve: food-grade silicone (not bio-based)\n- Lid: BPA-free polypropylene (recycled post-industrial)\n\n**Price:** \u00a312.50 GBP\n**Inventory:** 2,104 units UK, 1,876 units EU\n**Dishwasher safe:** Top",
513
+ "score": 0.4098,
514
+ "source": "pentatonic-memory",
515
+ "doc_id": "sku-coffee-cup-reusable"
516
+ },
517
+ {
518
+ "text": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta",
519
+ "score": 0.3846,
520
+ "source": "pentatonic-memory",
521
+ "doc_id": "sku-luna-bottle-42"
522
+ }
523
+ ],
524
+ "correct": false,
525
+ "score": 0.5,
526
+ "grading_notes": "missing 1/2: ['Not microwave-safe']",
527
+ "search_time_ms": 458.2784629892558,
528
+ "generation_time_ms": 0.0,
529
+ "tokens_in": 0,
530
+ "tokens_out": 0,
531
+ "retrieval_tokens": 299,
532
+ "query_tokens": 8,
533
+ "context_tokens": 291,
534
+ "judge_tokens_in": 0,
535
+ "judge_tokens_out": 0,
536
+ "judge_latency_ms": 0.0
537
+ },
538
+ {
539
+ "task_id": "sku-bin-liners-home-compost",
540
+ "query": "Are the Root bio bin liners home-compostable?",
541
+ "answer": "# Bio Bin Liners 30L (roll of 20) \u2014 SKU BBL-030-020\n\n**Brand:** Root\n**Category:** Home / Waste\n**Size:** 30 litres\n\n**Material composition:**\n- 100% PBAT + corn starch biopolymer\n- EN13432 certified industrially compostable\n- NOT home-compostable (requires industrial composting temperatures)\n\n**Price:** \u00a34.20 GBP per roll\n**Inventory:** 6,420 rolls UK, 2,100 rolls EU\n**Subscription:** Monthly auto-delivery available (\u00a33.60/roll)\n**Council scheme compatibility:** Check with your local authority\n---\n# Loop Reusable Coffee Cup 8oz \u2014 SKU LP-CUP-008\n\n**Brand:** Loop\n**Category:** Drinkware / Coffee\n**Capacity:** 8oz (240ml)\n\n**Material composition:**\n- Body: 100% plant-based PLA (corn-derived)\n- Silicone sleeve: food-grade silicone (not bio-based)\n- Lid: BPA-free polypropylene (recycled post-industrial)\n\n**Price:** \u00a312.50 GBP\n**Inventory:** 2,104 units UK, 1,876 units EU\n**Dishwasher safe:** Top rack only\n**Lifespan:** ~2 years regular use, then return for closed-loop composting\n**Note:** Not",
542
+ "hits": [
543
+ {
544
+ "text": "# Bio Bin Liners 30L (roll of 20) \u2014 SKU BBL-030-020\n\n**Brand:** Root\n**Category:** Home / Waste\n**Size:** 30 litres\n\n**Material composition:**\n- 100% PBAT + corn starch biopolymer\n- EN13432 certified industrially compostable\n- NOT home-compostable (requires industrial composting temperatures)\n\n**Price:** \u00a34.20 GBP per roll\n**Inventory:** 6,420 rolls UK, 2,100 rolls EU\n**Subscription:** Monthly aut",
545
+ "score": 0.4098,
546
+ "source": "pentatonic-memory",
547
+ "doc_id": "sku-biodegradable-trash-bags"
548
+ },
549
+ {
550
+ "text": "# Loop Reusable Coffee Cup 8oz \u2014 SKU LP-CUP-008\n\n**Brand:** Loop\n**Category:** Drinkware / Coffee\n**Capacity:** 8oz (240ml)\n\n**Material composition:**\n- Body: 100% plant-based PLA (corn-derived)\n- Silicone sleeve: food-grade silicone (not bio-based)\n- Lid: BPA-free polypropylene (recycled post-industrial)\n\n**Price:** \u00a312.50 GBP\n**Inventory:** 2,104 units UK, 1,876 units EU\n**Dishwasher safe:** Top",
551
+ "score": 0.3788,
552
+ "source": "pentatonic-memory",
553
+ "doc_id": "sku-coffee-cup-reusable"
554
+ }
555
+ ],
556
+ "correct": true,
557
+ "score": 1.0,
558
+ "grading_notes": "all substrings matched",
559
+ "search_time_ms": 448.9738449919969,
560
+ "generation_time_ms": 0.0,
561
+ "tokens_in": 0,
562
+ "tokens_out": 0,
563
+ "retrieval_tokens": 294,
564
+ "query_tokens": 11,
565
+ "context_tokens": 283,
566
+ "judge_tokens_in": 0,
567
+ "judge_tokens_out": 0,
568
+ "judge_latency_ms": 0.0
569
+ },
570
+ {
571
+ "task_id": "policy-custom-tote-return",
572
+ "query": "Can I return a custom-printed tote bag?",
573
+ "answer": "# Returns policy\n\nAll unused items returnable within 30 days of delivery for full refund.\nItems returned after 30 days but under 90 days: store credit only.\nTake-back programme is separate \u2014 applies to any lifetime-warrantied item at end of useful life.\nExceptions: custom-printed items (e.g. custom tote bags) and consumables (e.g. bin liners) are final sale.\n---\n# Canvas Tote Bag Large \u2014 SKU CTB-LG-001\n\n**Brand:** Fern\n**Category:** Bags / Totes\n**Dimensions:** 38cm \u00d7 42cm \u00d7 12cm (handle drop 25cm)\n**Capacity:** 16 litres\n\n**Material composition:**\n- 100% organic cotton canvas, 340 gsm\n- Handles: woven cotton webbing, reinforced with bartack stitching\n\n**Price:** \u00a322.00 GBP\n**Inventory:** 1,580 units UK\n**Print options:** Blank, Logo, Custom (+\u00a35 per unit, MOQ 12)\n**Max load:** 15kg",
574
+ "hits": [
575
+ {
576
+ "text": "# Returns policy\n\nAll unused items returnable within 30 days of delivery for full refund.\nItems returned after 30 days but under 90 days: store credit only.\nTake-back programme is separate \u2014 applies to any lifetime-warrantied item at end of useful life.\nExceptions: custom-printed items (e.g. custom tote bags) and consumables (e.g. bin liners) are final sale.\n",
577
+ "score": 0.4098,
578
+ "source": "pentatonic-memory",
579
+ "doc_id": "policy-returns-30day"
580
+ },
581
+ {
582
+ "text": "# Canvas Tote Bag Large \u2014 SKU CTB-LG-001\n\n**Brand:** Fern\n**Category:** Bags / Totes\n**Dimensions:** 38cm \u00d7 42cm \u00d7 12cm (handle drop 25cm)\n**Capacity:** 16 litres\n\n**Material composition:**\n- 100% organic cotton canvas, 340 gsm\n- Handles: woven cotton webbing, reinforced with bartack stitching\n\n**Price:** \u00a322.00 GBP\n**Inventory:** 1,580 units UK\n**Print options:** Blank, Logo, Custom (+\u00a35 per unit",
583
+ "score": 0.3846,
584
+ "source": "pentatonic-memory",
585
+ "doc_id": "sku-tote-canvas-large"
586
+ }
587
+ ],
588
+ "correct": true,
589
+ "score": 1.0,
590
+ "grading_notes": "all substrings matched",
591
+ "search_time_ms": 452.81719000195153,
592
+ "generation_time_ms": 0.0,
593
+ "tokens_in": 0,
594
+ "tokens_out": 0,
595
+ "retrieval_tokens": 228,
596
+ "query_tokens": 10,
597
+ "context_tokens": 218,
598
+ "judge_tokens_in": 0,
599
+ "judge_tokens_out": 0,
600
+ "judge_latency_ms": 0.0
601
+ },
602
+ {
603
+ "task_id": "price-tee-subscription",
604
+ "query": "What's the subscription price for the Luna water bottle compared to standard?",
605
+ "answer": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta\n**Replacement parts:** Lid (\u00a33.50), Silicone seal (\u00a30.90)\n**Warranty:** Lifetime on body, 2 years o\n---\n# Pricing tiers across catalogue\n\nStandard: list price as shown on PDP.\nSubscription: auto-ships every N weeks, typically 15% off standard.\nBulk (B2B): tiered discount starting at MOQ 50 units, call sales@pentatonic.com.\nTake-back credit: 50% of original price as store credit when returned via take-back programme.",
606
+ "hits": [
607
+ {
608
+ "text": "# Luna Water Bottle 500ml \u2014 SKU LUN-BTL-042\n\n**Brand:** Luna\n**Category:** Drinkware / Bottles\n**Capacity:** 500ml\n\n**Material composition:**\n- 100% food-grade 304 stainless steel (65% recycled content)\n- Lid: bio-based silicone (sugarcane derivative)\n\n**Price:** \u00a318.50 GBP\n**Inventory:** 87 units in stock (UK), 412 units (EU DC Eindhoven)\n**Colours available:** Matte black, Sage green, Terracotta",
609
+ "score": 0.4098,
610
+ "source": "pentatonic-memory",
611
+ "doc_id": "sku-luna-bottle-42"
612
+ },
613
+ {
614
+ "text": "# Pricing tiers across catalogue\n\nStandard: list price as shown on PDP.\nSubscription: auto-ships every N weeks, typically 15% off standard.\nBulk (B2B): tiered discount starting at MOQ 50 units, call sales@pentatonic.com.\nTake-back credit: 50% of original price as store credit when returned via take-back programme.\n",
615
+ "score": 0.4032,
616
+ "source": "pentatonic-memory",
617
+ "doc_id": "price-tiers-all"
618
+ }
619
+ ],
620
+ "correct": true,
621
+ "score": 1.0,
622
+ "grading_notes": "all substrings matched",
623
+ "search_time_ms": 499.92061901139095,
624
+ "generation_time_ms": 0.0,
625
+ "tokens_in": 0,
626
+ "tokens_out": 0,
627
+ "retrieval_tokens": 237,
628
+ "query_tokens": 14,
629
+ "context_tokens": 223,
630
+ "judge_tokens_in": 0,
631
+ "judge_tokens_out": 0,
632
+ "judge_latency_ms": 0.0
633
+ },
634
+ {
635
+ "task_id": "price-sleeve-diff",
636
+ "query": "How much more does the 15\" Haven Laptop Sleeve cost than the 13\" variant?",
637
+ "answer": "# Haven Laptop Sleeve 15\" \u2014 SKU HVN-SLV-15\n\nAs HVN-SLV-13 but for 15\"-16\" laptops. Same materials, same construction.\n\n**Fits:** 15\" MacBook Air, 16\" MacBook Pro, 15.6\" Dell XPS, 15\" ThinkPad\n**Price:** \u00a358.00 GBP (\u00a310 more than 13\" variant)\n**Inventory:** 89 units UK, 54 units EU\n**Colours available:** Charcoal only (Oat and Ochre sold through)\n---\n# Compatibility note\n\nThe Haven Laptop Sleeve 13\" (HVN-SLV-13) does NOT fit the 14\" MacBook Pro \u2014 third-party dimensions exceed 31.5cm. Use the 15\" variant (HVN-SLV-15).\n---\n# Haven Laptop Sleeve 13\" \u2014 SKU HVN-SLV-13\n\n**Brand:** Haven\n**Category:** Bags / Laptop protection\n**Fits:** 13\" MacBook Air M2/M3, 13.6\" MacBook Air, 13\" Dell XPS, 13\" ThinkPad\n\n**Material composition:**\n- Outer: 100% recycled PET felt (from 12 plastic bottles per unit)\n- Inner lining: 100% post-consumer recycled polyester\n- YKK recycled-polyester zip\n\n**Price:** \u00a348.00 GBP\n**Inventory:** 238 units UK, 156 units EU\n**Colours available:** Charcoal, Oat, Ochre\n**Laptop diagonal max:** 13.6\" (thi",
638
+ "hits": [
639
+ {
640
+ "text": "# Haven Laptop Sleeve 15\" \u2014 SKU HVN-SLV-15\n\nAs HVN-SLV-13 but for 15\"-16\" laptops. Same materials, same construction.\n\n**Fits:** 15\" MacBook Air, 16\" MacBook Pro, 15.6\" Dell XPS, 15\" ThinkPad\n**Price:** \u00a358.00 GBP (\u00a310 more than 13\" variant)\n**Inventory:** 89 units UK, 54 units EU\n**Colours available:** Charcoal only (Oat and Ochre sold through)\n",
641
+ "score": 0.4098,
642
+ "source": "pentatonic-memory",
643
+ "doc_id": "sku-laptop-sleeve-15"
644
+ },
645
+ {
646
+ "text": "# Compatibility note\n\nThe Haven Laptop Sleeve 13\" (HVN-SLV-13) does NOT fit the 14\" MacBook Pro \u2014 third-party dimensions exceed 31.5cm. Use the 15\" variant (HVN-SLV-15).\n",
647
+ "score": 0.4032,
648
+ "source": "pentatonic-memory",
649
+ "doc_id": "compat-laptop-sleeve-macbook-pro-14"
650
+ },
651
+ {
652
+ "text": "# Haven Laptop Sleeve 13\" \u2014 SKU HVN-SLV-13\n\n**Brand:** Haven\n**Category:** Bags / Laptop protection\n**Fits:** 13\" MacBook Air M2/M3, 13.6\" MacBook Air, 13\" Dell XPS, 13\" ThinkPad\n\n**Material composition:**\n- Outer: 100% recycled PET felt (from 12 plastic bottles per unit)\n- Inner lining: 100% post-consumer recycled polyester\n- YKK recycled-polyester zip\n\n**Price:** \u00a348.00 GBP\n**Inventory:** 238 un",
653
+ "score": 0.3968,
654
+ "source": "pentatonic-memory",
655
+ "doc_id": "sku-laptop-sleeve-13"
656
+ }
657
+ ],
658
+ "correct": true,
659
+ "score": 1.0,
660
+ "grading_notes": "all substrings matched",
661
+ "search_time_ms": 560.5700919986703,
662
+ "generation_time_ms": 0.0,
663
+ "tokens_in": 0,
664
+ "tokens_out": 0,
665
+ "retrieval_tokens": 351,
666
+ "query_tokens": 19,
667
+ "context_tokens": 332,
668
+ "judge_tokens_in": 0,
669
+ "judge_tokens_out": 0,
670
+ "judge_latency_ms": 0.0
671
+ },
672
+ {
673
+ "task_id": "multi-hop-kite-duotone",
674
+ "query": "I have a Duotone bar \u2014 will the Nomad Kite Harness v3 work with it out of the box?",
675
+ "answer": "# Compatibility note\n\nThe Nomad Kite Harness v3 (NMD-HRN-V3) ships with a standard spreader bar compatible with F-One and North bar systems. For Duotone or Core bar systems, the Duotone/Core adapter kit (NMD-ADPT-DC, \u00a3 18) is required.\n---\n# Nomad Kite Harness v3 \u2014 SKU NMD-HRN-V3\n\n**Brand:** Nomad Sports\n**Category:** Watersports / Kite surfing\n**Size range:** XS (26-28\"), S (28-30\"), M (30-32\"), L (32-34\"), XL (34-36\")\n\n**Material composition:**\n- Outer shell: 92% recycled nylon 6,6 (ghost-net source)\n- Foam padding: EVA (non-recycled)\n- Hardware: 316 stainless steel spreader bar\n\n**Price:** \u00a3145.00 GBP\n**Inventory:** M=out of stock, L=6 units, XL=12 units, XS/S=restock 2026-05-15\n**Repair service:** \u00a325 flat fee, turnaround 14 d\n---\n# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.",
676
+ "hits": [
677
+ {
678
+ "text": "# Compatibility note\n\nThe Nomad Kite Harness v3 (NMD-HRN-V3) ships with a standard spreader bar compatible with F-One and North bar systems. For Duotone or Core bar systems, the Duotone/Core adapter kit (NMD-ADPT-DC, \u00a3 18) is required.\n",
679
+ "score": 0.4098,
680
+ "source": "pentatonic-memory",
681
+ "doc_id": "compat-kite-harness-bar"
682
+ },
683
+ {
684
+ "text": "# Nomad Kite Harness v3 \u2014 SKU NMD-HRN-V3\n\n**Brand:** Nomad Sports\n**Category:** Watersports / Kite surfing\n**Size range:** XS (26-28\"), S (28-30\"), M (30-32\"), L (32-34\"), XL (34-36\")\n\n**Material composition:**\n- Outer shell: 92% recycled nylon 6,6 (ghost-net source)\n- Foam padding: EVA (non-recycled)\n- Hardware: 316 stainless steel spreader bar\n\n**Price:** \u00a3145.00 GBP\n**Inventory:** M=out of stoc",
685
+ "score": 0.3968,
686
+ "source": "pentatonic-memory",
687
+ "doc_id": "sku-kite-harness-v3"
688
+ },
689
+ {
690
+ "text": "# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n",
691
+ "score": 0.3846,
692
+ "source": "pentatonic-memory",
693
+ "doc_id": "inventory-update-2026-04-15"
694
+ }
695
+ ],
696
+ "correct": true,
697
+ "score": 1.0,
698
+ "grading_notes": "all substrings matched",
699
+ "search_time_ms": 493.0140280048363,
700
+ "generation_time_ms": 0.0,
701
+ "tokens_in": 0,
702
+ "tokens_out": 0,
703
+ "retrieval_tokens": 365,
704
+ "query_tokens": 25,
705
+ "context_tokens": 340,
706
+ "judge_tokens_in": 0,
707
+ "judge_tokens_out": 0,
708
+ "judge_latency_ms": 0.0
709
+ },
710
+ {
711
+ "task_id": "multi-hop-takeback-credit",
712
+ "query": "If I return an Atlas Phone Shell via take-back after 2 years, how much store credit do I get?",
713
+ "answer": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at UK fulfilment (Worthing DC)\n**Take-back:** Yes \u2014 returnable for 50% credit after 18 months\n**Certific\n---\n# Pricing tiers across catalogue\n\nStandard: list price as shown on PDP.\nSubscription: auto-ships every N weeks, typically 15% off standard.\nBulk (B2B): tiered discount starting at MOQ 50 units, call sales@pentatonic.com.\nTake-back credit: 50% of original price as store credit when returned via take-back programme.\n---\n# Returns policy\n\nAll unused items returnable within 30 days of delivery for full refund.\nItems returned after 30 days but under 90 days: store credit only.\nTake-back programme is separate \u2014 applies to any lifetime-warrantied item at end of useful life.\nExceptions: custom-printed items (e.g. custom tote bags) and consumables (e.g. bin liners) are final sale.",
714
+ "hits": [
715
+ {
716
+ "text": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at U",
717
+ "score": 0.4032,
718
+ "source": "pentatonic-memory",
719
+ "doc_id": "sku-atlas-phone-01"
720
+ },
721
+ {
722
+ "text": "# Pricing tiers across catalogue\n\nStandard: list price as shown on PDP.\nSubscription: auto-ships every N weeks, typically 15% off standard.\nBulk (B2B): tiered discount starting at MOQ 50 units, call sales@pentatonic.com.\nTake-back credit: 50% of original price as store credit when returned via take-back programme.\n",
723
+ "score": 0.3906,
724
+ "source": "pentatonic-memory",
725
+ "doc_id": "price-tiers-all"
726
+ },
727
+ {
728
+ "text": "# Returns policy\n\nAll unused items returnable within 30 days of delivery for full refund.\nItems returned after 30 days but under 90 days: store credit only.\nTake-back programme is separate \u2014 applies to any lifetime-warrantied item at end of useful life.\nExceptions: custom-printed items (e.g. custom tote bags) and consumables (e.g. bin liners) are final sale.\n",
729
+ "score": 0.3846,
730
+ "source": "pentatonic-memory",
731
+ "doc_id": "policy-returns-30day"
732
+ }
733
+ ],
734
+ "correct": false,
735
+ "score": 0.0,
736
+ "grading_notes": "missing 1/2: ['14.50']; forbidden substring(s) present: ['\u00a329', '\u00a324']",
737
+ "search_time_ms": 535.9368770150468,
738
+ "generation_time_ms": 0.0,
739
+ "tokens_in": 0,
740
+ "tokens_out": 0,
741
+ "retrieval_tokens": 323,
742
+ "query_tokens": 23,
743
+ "context_tokens": 300,
744
+ "judge_tokens_in": 0,
745
+ "judge_tokens_out": 0,
746
+ "judge_latency_ms": 0.0
747
+ },
748
+ {
749
+ "task_id": "rubric-recommend-kitesurf-bag",
750
+ "query": "I'm heading to Worthing for a kite session and need to carry my 15\" MacBook and some kit. What would you recommend from the catalogue?",
751
+ "answer": "# Haven Laptop Sleeve 15\" \u2014 SKU HVN-SLV-15\n\nAs HVN-SLV-13 but for 15\"-16\" laptops. Same materials, same construction.\n\n**Fits:** 15\" MacBook Air, 16\" MacBook Pro, 15.6\" Dell XPS, 15\" ThinkPad\n**Price:** \u00a358.00 GBP (\u00a310 more than 13\" variant)\n**Inventory:** 89 units UK, 54 units EU\n**Colours available:** Charcoal only (Oat and Ochre sold through)\n---\n# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n---\n# Haven Laptop Sleeve 13\" \u2014 SKU HVN-SLV-13\n\n**Brand:** Haven\n**Category:** Bags / Laptop protection\n**Fits:** 13\" MacBook Air M2/M3, 13.6\" MacBook Air, 13\" Dell XPS, 13\" ThinkPad\n\n**Material composition:**\n- Outer: 100% recycled PET felt (from 12 plastic bottles per unit)\n- Inner lining: 100% post-consumer recycled polyester\n- YKK recycled-polyester zip\n\n**Price:** \u00a348.00 GBP\n**Inventory:** 238 units UK, 156 units EU\n**Colours available:** Charcoal, Oat, Ochre\n**Laptop diagonal max:** 13.6\" (thi",
752
+ "hits": [
753
+ {
754
+ "text": "# Haven Laptop Sleeve 15\" \u2014 SKU HVN-SLV-15\n\nAs HVN-SLV-13 but for 15\"-16\" laptops. Same materials, same construction.\n\n**Fits:** 15\" MacBook Air, 16\" MacBook Pro, 15.6\" Dell XPS, 15\" ThinkPad\n**Price:** \u00a358.00 GBP (\u00a310 more than 13\" variant)\n**Inventory:** 89 units UK, 54 units EU\n**Colours available:** Charcoal only (Oat and Ochre sold through)\n",
755
+ "score": 0.4098,
756
+ "source": "pentatonic-memory",
757
+ "doc_id": "sku-laptop-sleeve-15"
758
+ },
759
+ {
760
+ "text": "# Inventory update \u2014 2026-04-15\n\nPentatonic Crew Tee Black XXS/XXL: discontinued, not restocking.\nNomad Kite Harness v3 M: sold out, restock ETA 2026-05-15.\nHaven Laptop Sleeve 15\": Oat and Ochre sold through, Charcoal only until SS27 refresh.\nAtlas Phone Shell: new batch inbound 2026-04-28, inventory will top up to ~3000 units.\n",
761
+ "score": 0.3968,
762
+ "source": "pentatonic-memory",
763
+ "doc_id": "inventory-update-2026-04-15"
764
+ },
765
+ {
766
+ "text": "# Haven Laptop Sleeve 13\" \u2014 SKU HVN-SLV-13\n\n**Brand:** Haven\n**Category:** Bags / Laptop protection\n**Fits:** 13\" MacBook Air M2/M3, 13.6\" MacBook Air, 13\" Dell XPS, 13\" ThinkPad\n\n**Material composition:**\n- Outer: 100% recycled PET felt (from 12 plastic bottles per unit)\n- Inner lining: 100% post-consumer recycled polyester\n- YKK recycled-polyester zip\n\n**Price:** \u00a348.00 GBP\n**Inventory:** 238 un",
767
+ "score": 0.3906,
768
+ "source": "pentatonic-memory",
769
+ "doc_id": "sku-laptop-sleeve-13"
770
+ }
771
+ ],
772
+ "correct": false,
773
+ "score": 0.0,
774
+ "grading_notes": "judge-error: judge did not return parseable JSON",
775
+ "search_time_ms": 474.2175440187566,
776
+ "generation_time_ms": 0.0,
777
+ "tokens_in": 0,
778
+ "tokens_out": 0,
779
+ "retrieval_tokens": 413,
780
+ "query_tokens": 31,
781
+ "context_tokens": 382,
782
+ "judge_tokens_in": 724,
783
+ "judge_tokens_out": 51,
784
+ "judge_latency_ms": 1100.580383002758
785
+ },
786
+ {
787
+ "task_id": "rubric-plastic-free-tee",
788
+ "query": "Which tees in the catalogue are completely plastic-free?",
789
+ "answer": "# Pentatonic Crew Tee Black \u2014 SKU PTT-TEE-BLK\n\n**Brand:** Pentatonic\n**Category:** Apparel / T-shirts\n**Fit:** Unisex regular\n**Size range:** XS, S, M, L, XL, XXL\n\n**Material composition:**\n- 100% GOTS-certified organic cotton, 180 gsm\n- Dyeing: low-impact reactive dye, closed-loop water system\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=48, M=136, L=94, XL=22, XS=0 (discontinued), XXL=0 (discontinued)\n**Country of origin:** Portugal (CITEVE-certified mill)\n**Care:** Wash cold, line dry; no tumble d\n---\n# Pentatonic Crew Tee Sage \u2014 SKU PTT-TEE-SGE\n\nAs PTT-TEE-BLK but in sage green. Same material composition, same mill.\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=12, M=38, L=44, XL=8, XS=0, XXL=0\n**Colour note:** Sage is a seasonal SS26 colourway \u2014 not restocked after sell-through.\n---\n# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at UK fulfilment (Worthing DC)\n**Take-back:** Yes \u2014 returnable for 50% credit after 18 months\n**Certific",
790
+ "hits": [
791
+ {
792
+ "text": "# Pentatonic Crew Tee Black \u2014 SKU PTT-TEE-BLK\n\n**Brand:** Pentatonic\n**Category:** Apparel / T-shirts\n**Fit:** Unisex regular\n**Size range:** XS, S, M, L, XL, XXL\n\n**Material composition:**\n- 100% GOTS-certified organic cotton, 180 gsm\n- Dyeing: low-impact reactive dye, closed-loop water system\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=48, M=136, L=94, XL=22, XS=0 (discontinued), XXL=0 (discontinued",
793
+ "score": 0.4098,
794
+ "source": "pentatonic-memory",
795
+ "doc_id": "sku-cotton-tee-black"
796
+ },
797
+ {
798
+ "text": "# Pentatonic Crew Tee Sage \u2014 SKU PTT-TEE-SGE\n\nAs PTT-TEE-BLK but in sage green. Same material composition, same mill.\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=12, M=38, L=44, XL=8, XS=0, XXL=0\n**Colour note:** Sage is a seasonal SS26 colourway \u2014 not restocked after sell-through.\n",
799
+ "score": 0.3968,
800
+ "source": "pentatonic-memory",
801
+ "doc_id": "sku-cotton-tee-sage"
802
+ },
803
+ {
804
+ "text": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at U",
805
+ "score": 0.3906,
806
+ "source": "pentatonic-memory",
807
+ "doc_id": "sku-atlas-phone-01"
808
+ }
809
+ ],
810
+ "correct": false,
811
+ "score": 0.5,
812
+ "grading_notes": "judge=0.50 \u2014 The answer mentions the Pentatonic Crew Tee Black and Sage as being made from organic cotton with low-impact reactive dy",
813
+ "search_time_ms": 444.13008002447896,
814
+ "generation_time_ms": 0.0,
815
+ "tokens_in": 0,
816
+ "tokens_out": 0,
817
+ "retrieval_tokens": 404,
818
+ "query_tokens": 11,
819
+ "context_tokens": 393,
820
+ "judge_tokens_in": 701,
821
+ "judge_tokens_out": 50,
822
+ "judge_latency_ms": 1114.83097499609
823
+ },
824
+ {
825
+ "task_id": "rubric-cc-certified-items",
826
+ "query": "Do any items in the catalogue have Cradle to Cradle certification?",
827
+ "answer": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at UK fulfilment (Worthing DC)\n**Take-back:** Yes \u2014 returnable for 50% credit after 18 months\n**Certific\n---\n# Pentatonic Crew Tee Black \u2014 SKU PTT-TEE-BLK\n\n**Brand:** Pentatonic\n**Category:** Apparel / T-shirts\n**Fit:** Unisex regular\n**Size range:** XS, S, M, L, XL, XXL\n\n**Material composition:**\n- 100% GOTS-certified organic cotton, 180 gsm\n- Dyeing: low-impact reactive dye, closed-loop water system\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=48, M=136, L=94, XL=22, XS=0 (discontinued), XXL=0 (discontinued)\n**Country of origin:** Portugal (CITEVE-certified mill)\n**Care:** Wash cold, line dry; no tumble d",
828
+ "hits": [
829
+ {
830
+ "text": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at U",
831
+ "score": 0.4032,
832
+ "source": "pentatonic-memory",
833
+ "doc_id": "sku-atlas-phone-01"
834
+ },
835
+ {
836
+ "text": "# Pentatonic Crew Tee Black \u2014 SKU PTT-TEE-BLK\n\n**Brand:** Pentatonic\n**Category:** Apparel / T-shirts\n**Fit:** Unisex regular\n**Size range:** XS, S, M, L, XL, XXL\n\n**Material composition:**\n- 100% GOTS-certified organic cotton, 180 gsm\n- Dyeing: low-impact reactive dye, closed-loop water system\n\n**Price:** \u00a328.00 GBP\n**Inventory:** S=48, M=136, L=94, XL=22, XS=0 (discontinued), XXL=0 (discontinued",
837
+ "score": 0.3788,
838
+ "source": "pentatonic-memory",
839
+ "doc_id": "sku-cotton-tee-black"
840
+ }
841
+ ],
842
+ "correct": true,
843
+ "score": 1.0,
844
+ "grading_notes": "judge=1.00 \u2014 The Atlas Phone Shell is named with Cradle to Cradle Bronze certification.",
845
+ "search_time_ms": 461.1902699980419,
846
+ "generation_time_ms": 0.0,
847
+ "tokens_in": 0,
848
+ "tokens_out": 0,
849
+ "retrieval_tokens": 314,
850
+ "query_tokens": 14,
851
+ "context_tokens": 300,
852
+ "judge_tokens_in": 589,
853
+ "judge_tokens_out": 29,
854
+ "judge_latency_ms": 567.9309439957142
855
+ },
856
+ {
857
+ "task_id": "entity-recycled-content-high",
858
+ "query": "Which items in the catalogue use at least 50% recycled material?",
859
+ "answer": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at UK fulfilment (Worthing DC)\n**Take-back:** Yes \u2014 returnable for 50% credit after 18 months\n**Certific",
860
+ "hits": [
861
+ {
862
+ "text": "# Atlas Phone Shell \u2014 SKU ATL-PHN-001\n\n**Brand:** Atlas Circular\n**Category:** Mobile accessories / Phone cases\n**Compatible with:** iPhone 15, iPhone 15 Pro\n\n**Material composition:**\n- 68% recycled ocean-bound polypropylene\n- 24% recycled polycarbonate (post-consumer)\n- 8% natural calcium carbonate\n\n**Price:** \u00a329.00 GBP (standard) / \u00a324.00 (subscription)\n**Inventory:** 1,240 units in stock at U",
863
+ "score": 0.3968,
864
+ "source": "pentatonic-memory",
865
+ "doc_id": "sku-atlas-phone-01"
866
+ }
867
+ ],
868
+ "correct": false,
869
+ "score": 0.0,
870
+ "grading_notes": "no expected_substrings set",
871
+ "search_time_ms": 489.93708699708804,
872
+ "generation_time_ms": 0.0,
873
+ "tokens_in": 0,
874
+ "tokens_out": 0,
875
+ "retrieval_tokens": 151,
876
+ "query_tokens": 14,
877
+ "context_tokens": 137,
878
+ "judge_tokens_in": 0,
879
+ "judge_tokens_out": 0,
880
+ "judge_latency_ms": 0.0
881
+ }
882
+ ]
883
+ }