Few-shot Benchmark Report

Run ID: 20260505T181843Z | Generated UTC: 2026-05-05T18:21:48.786233+00:00

Configuration

{
  "models": [
    "opus-4-5",
    "opus-4-6",
    "sonnet-4-5",
    "sonnet-4-6"
  ],
  "fewshot_strategies": [
    "db_only",
    "db_plus_raw",
    "raw_only",
    "zero_shot"
  ],
  "chat_count": 21,
  "runs_per_chat": 1,
  "max_workers": 15,
  "raw_fewshot_count": 26,
  "raw_fewshot_labels_filter": []
}

Model + Strategy Summary

Model | Strategy | Runs | Success rate | Avg attempts | Avg elapsed (s) | Avg mismatch/expected run | Field match rate
opus-4-5 | db_only | 21 | 1.0000 | 1.0000 | 8.5433 | 7.6190 | 0.6825
opus-4-5 | db_plus_raw | 21 | 1.0000 | 1.0000 | 8.4424 | 8.6667 | 0.6546
opus-4-5 | raw_only | 21 | 1.0000 | 1.0000 | 18.7446 | 8.2381 | 0.6717
opus-4-5 | zero_shot | 21 | 1.0000 | 1.0000 | 7.2798 | 7.0000 | 0.7474
opus-4-6 | db_only | 21 | 1.0000 | 1.0000 | 7.8629 | 9.2381 | 0.6572
opus-4-6 | db_plus_raw | 21 | 1.0000 | 1.0000 | 8.7017 | 8.5238 | 0.6603
opus-4-6 | raw_only | 21 | 1.0000 | 1.0000 | 6.4485 | 8.0000 | 0.6812
opus-4-6 | zero_shot | 21 | 1.0000 | 1.0000 | 5.6740 | 6.1429 | 0.8045
sonnet-4-5 | db_only | 21 | 1.0000 | 1.0000 | 7.7986 | 7.7143 | 0.6867
sonnet-4-5 | db_plus_raw | 21 | 1.0000 | 1.0000 | 7.9757 | 7.9524 | 0.6687
sonnet-4-5 | raw_only | 21 | 1.0000 | 1.0000 | 7.0987 | 8.7143 | 0.6528
sonnet-4-5 | zero_shot | 21 | 1.0000 | 1.0000 | 6.0658 | 8.8095 | 0.7082
sonnet-4-6 | db_only | 21 | 1.0000 | 1.0000 | 6.9770 | 9.6190 | 0.6167
sonnet-4-6 | db_plus_raw | 21 | 1.0000 | 1.0000 | 9.5087 | 8.8571 | 0.6471
sonnet-4-6 | raw_only | 21 | 1.0000 | 1.0000 | 6.5341 | 8.3810 | 0.6660
sonnet-4-6 | zero_shot | 21 | 1.0000 | 1.0000 | 6.3680 | 8.6190 | 0.6943

Per-chat Breakdown

Chat | Model | Strategy | Runs | Success rate | Avg elapsed (s) | Mismatch counts
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_only11.00007.7978[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_plus_raw11.00007.0853[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5raw_only11.000024.1299[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5zero_shot11.00005.8588[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_only11.00006.4233[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_plus_raw11.00007.0704[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6raw_only11.00004.9494[14]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6zero_shot11.00004.9043[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5db_only11.00007.7478[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5db_plus_raw11.00006.7182[14]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5raw_only11.00005.3144[13]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5zero_shot11.00005.2814[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_only11.00005.4053[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_plus_raw11.000011.9693[15]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6raw_only11.00004.9705[16]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6zero_shot11.00004.4847[15]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_only11.00007.5812[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_plus_raw11.00006.3277[15]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5raw_only11.000036.8433[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5zero_shot11.00005.5772[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6db_only11.00006.8242[15]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6db_plus_raw11.00007.0935[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6raw_only11.00005.0888[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6zero_shot11.00004.8696[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5db_only11.00006.5448[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5db_plus_raw11.00006.2405[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5raw_only11.00005.0286[13]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5zero_shot11.00005.7057[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_only11.00008.1873[14]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_plus_raw11.000013.1192[15]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6raw_only11.00006.4834[15]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6zero_shot11.00009.7462[15]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_only11.000010.2789[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_plus_raw11.00008.4137[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5raw_only11.000016.2404[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5zero_shot11.00009.2448[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_only11.00008.8351[16]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_plus_raw11.000010.5065[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6raw_only11.00008.9427[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6zero_shot11.00006.9384[16]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5db_only11.000010.6220[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5db_plus_raw11.000011.3037[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5raw_only11.00009.1418[16]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5zero_shot11.00008.8018[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_only11.00008.3721[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_plus_raw11.000010.7353[17]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6raw_only11.00009.1441[18]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6zero_shot11.00006.6795[16]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-5db_only11.00006.0217[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-5db_plus_raw11.00006.5016[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-5raw_only11.00005.6084[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-5zero_shot11.00004.8310[15]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6db_only11.00006.6959[15]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6db_plus_raw11.00006.9577[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6raw_only11.00005.1176[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6zero_shot11.00005.0645[15]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5db_only11.00008.6198[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5db_plus_raw11.00006.7137[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5raw_only11.00005.4114[12]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5zero_shot11.00004.8157[16]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6db_only11.00006.1352[14]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6db_plus_raw11.000018.4370[15]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6raw_only11.00005.3292[13]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6zero_shot11.00004.3817[18]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_only11.00006.9010[14]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_plus_raw11.00006.2877[15]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5raw_only11.00005.7034[15]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5zero_shot11.00005.0730[14]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6db_only11.00007.4538[13]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6db_plus_raw11.00008.8038[14]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6raw_only11.00005.5405[15]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6zero_shot11.00005.0031[13]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5db_only11.00007.4256[14]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5db_plus_raw11.00006.7737[14]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5raw_only11.00005.2603[12]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5zero_shot11.00005.3230[13]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_only11.00005.6681[14]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_plus_raw11.00006.3477[15]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6raw_only11.00005.1549[15]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6zero_shot11.00004.6234[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_only11.00006.7210[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_plus_raw11.00006.7340[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5raw_only11.00005.4206[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5zero_shot11.00004.9127[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_only11.00006.5684[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_plus_raw11.00006.9537[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6raw_only11.00005.2512[13]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6zero_shot11.00004.8988[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5db_only11.00006.0317[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5db_plus_raw11.00006.0662[13]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5raw_only11.00005.0284[13]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5zero_shot11.00005.1464[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_only11.00005.6211[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_plus_raw11.00009.9350[14]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6raw_only11.00004.8295[13]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6zero_shot11.00004.5296[13]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_only11.00006.2858[1]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_plus_raw11.00006.5685[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5raw_only11.00004.4782[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5zero_shot11.00002.5649[1]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_only11.00006.1288[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_plus_raw11.00008.9531[19]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6raw_only11.00004.6804[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6zero_shot11.00002.5292[1]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5db_only11.00004.4219[1]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5db_plus_raw11.00005.6431[1]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5raw_only11.00005.0054[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5zero_shot11.00003.0747[1]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_only11.00004.7528[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_plus_raw11.00006.3440[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6raw_only11.00004.2338[17]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6zero_shot11.00003.9791[17]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_only11.00006.3090[17]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_plus_raw11.00006.6022[17]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5raw_only11.00005.6837[10]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5zero_shot11.00005.2415[14]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_only11.00008.2271[20]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_plus_raw11.00007.0444[15]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6raw_only11.00005.7848[11]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6zero_shot11.00005.3247[12]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_only11.00006.7570[15]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_plus_raw11.00006.4338[16]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5raw_only11.00008.2128[11]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5zero_shot11.00005.3753[19]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_only11.00005.9355[17]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_plus_raw11.00007.1856[15]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6raw_only11.00005.3204[11]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6zero_shot11.00005.6384[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_only11.00006.5105[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_plus_raw11.000026.7842[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5raw_only11.00006.4909[10]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5zero_shot11.00005.2616[12]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_only11.00008.0422[20]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_plus_raw11.000010.7803[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6raw_only11.00005.5738[11]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6zero_shot11.00005.2122[10]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_only11.00006.2280[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_plus_raw11.00006.8198[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5raw_only11.00007.9559[10]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5zero_shot11.00005.5881[17]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_only11.00005.5759[16]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_plus_raw11.00006.3609[15]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6raw_only11.00006.2904[11]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6zero_shot11.00005.0627[13]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_only11.000016.0715[5]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw11.000011.3479[6]
multiple_product_multiple_shipment_complex.jsonopus-4-5raw_only11.000012.9087[7]
multiple_product_multiple_shipment_complex.jsonopus-4-5zero_shot11.000012.6850[4]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_only11.000013.2585[5]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw11.000012.6782[6]
multiple_product_multiple_shipment_complex.jsonopus-4-6raw_only11.000010.9548[5]
multiple_product_multiple_shipment_complex.jsonopus-4-6zero_shot11.00009.5077[0]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_only11.000012.5446[6]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw11.000012.4740[6]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5raw_only11.000012.6567[7]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5zero_shot11.00009.7879[21]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_only11.000010.5450[5]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw11.000013.4019[7]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6raw_only11.000011.1374[5]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6zero_shot11.000011.3678[7]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_only11.000010.3140[7]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_plus_raw11.000010.4044[8]
multiple_product_multiple_shipment_medium.jsonopus-4-5raw_only11.000034.8145[8]
multiple_product_multiple_shipment_medium.jsonopus-4-5zero_shot11.00007.8371[7]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_only11.00009.2891[7]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw11.000010.5483[7]
multiple_product_multiple_shipment_medium.jsonopus-4-6raw_only11.00008.4393[8]
multiple_product_multiple_shipment_medium.jsonopus-4-6zero_shot11.00006.6737[0]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_only11.00008.7758[7]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_plus_raw11.00009.9930[7]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5raw_only11.00008.7901[9]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5zero_shot11.00007.8483[8]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_only11.00008.9151[7]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw11.00009.5254[7]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6raw_only11.00007.9204[7]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot11.00007.5363[7]
multiple_product_multiple_shipment_simple.jsonopus-4-5db_only11.00009.0913[3]
multiple_product_multiple_shipment_simple.jsonopus-4-5db_plus_raw11.00008.9143[3]
multiple_product_multiple_shipment_simple.jsonopus-4-5raw_only11.000025.9565[4]
multiple_product_multiple_shipment_simple.jsonopus-4-5zero_shot11.000010.6499[6]
multiple_product_multiple_shipment_simple.jsonopus-4-6db_only11.00007.5350[5]
multiple_product_multiple_shipment_simple.jsonopus-4-6db_plus_raw11.00008.9789[5]
multiple_product_multiple_shipment_simple.jsonopus-4-6raw_only11.00007.8721[4]
multiple_product_multiple_shipment_simple.jsonopus-4-6zero_shot11.00006.1409[6]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5db_only11.00007.6163[1]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5db_plus_raw11.00008.3078[5]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5raw_only11.00008.0564[6]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5zero_shot11.00005.9383[7]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6db_only11.00007.8850[6]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6db_plus_raw11.00008.3081[3]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6raw_only11.00006.8336[3]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6zero_shot11.00008.1147[7]
real_world_msgs_test_v1.jsonopus-4-5db_only11.00008.3186[0]
real_world_msgs_test_v1.jsonopus-4-5db_plus_raw11.00006.9379[1]
real_world_msgs_test_v1.jsonopus-4-5raw_only11.000025.9336[1]
real_world_msgs_test_v1.jsonopus-4-5zero_shot11.00005.9894[0]
real_world_msgs_test_v1.jsonopus-4-6db_only11.00006.2971[0]
real_world_msgs_test_v1.jsonopus-4-6db_plus_raw11.00006.8210[0]
real_world_msgs_test_v1.jsonopus-4-6raw_only11.00005.3569[1]
real_world_msgs_test_v1.jsonopus-4-6zero_shot11.00005.0713[3]
real_world_msgs_test_v1.jsonsonnet-4-5db_only11.00007.8192[3]
real_world_msgs_test_v1.jsonsonnet-4-5db_plus_raw11.00009.0627[3]
real_world_msgs_test_v1.jsonsonnet-4-5raw_only11.00007.9241[4]
real_world_msgs_test_v1.jsonsonnet-4-5zero_shot11.00006.1579[3]
real_world_msgs_test_v1.jsonsonnet-4-6db_only11.00007.8122[3]
real_world_msgs_test_v1.jsonsonnet-4-6db_plus_raw11.00007.3667[3]
real_world_msgs_test_v1.jsonsonnet-4-6raw_only11.00005.1861[4]
real_world_msgs_test_v1.jsonsonnet-4-6zero_shot11.00005.3736[6]
real_world_msgs_test_v2.jsonopus-4-5db_only11.00008.3792[4]
real_world_msgs_test_v2.jsonopus-4-5db_plus_raw11.00007.0715[4]
real_world_msgs_test_v2.jsonopus-4-5raw_only11.000022.9605[5]
real_world_msgs_test_v2.jsonopus-4-5zero_shot11.000012.2644[4]
real_world_msgs_test_v2.jsonopus-4-6db_only11.00007.8168[4]
real_world_msgs_test_v2.jsonopus-4-6db_plus_raw11.00008.2556[4]
real_world_msgs_test_v2.jsonopus-4-6raw_only11.00007.0224[5]
real_world_msgs_test_v2.jsonopus-4-6zero_shot11.00006.5707[1]
real_world_msgs_test_v2.jsonsonnet-4-5db_only11.00007.3369[4]
real_world_msgs_test_v2.jsonsonnet-4-5db_plus_raw11.00007.6004[6]
real_world_msgs_test_v2.jsonsonnet-4-5raw_only11.00007.7079[10]
real_world_msgs_test_v2.jsonsonnet-4-5zero_shot11.00006.7791[4]
real_world_msgs_test_v2.jsonsonnet-4-6db_only11.00007.4030[6]
real_world_msgs_test_v2.jsonsonnet-4-6db_plus_raw11.00007.3668[6]
real_world_msgs_test_v2.jsonsonnet-4-6raw_only11.00007.3119[6]
real_world_msgs_test_v2.jsonsonnet-4-6zero_shot11.00008.3625[3]
real_world_msgs_test_v3.jsonopus-4-5db_only11.00008.6902[3]
real_world_msgs_test_v3.jsonopus-4-5db_plus_raw11.00007.0972[3]
real_world_msgs_test_v3.jsonopus-4-5raw_only11.000023.7314[3]
real_world_msgs_test_v3.jsonopus-4-5zero_shot11.000010.7949[0]
real_world_msgs_test_v3.jsonopus-4-6db_only11.00009.1579[3]
real_world_msgs_test_v3.jsonopus-4-6db_plus_raw11.00008.4501[3]
real_world_msgs_test_v3.jsonopus-4-6raw_only11.00006.7960[3]
real_world_msgs_test_v3.jsonopus-4-6zero_shot11.00006.3371[3]
real_world_msgs_test_v3.jsonsonnet-4-5db_only11.00007.9646[3]
real_world_msgs_test_v3.jsonsonnet-4-5db_plus_raw11.00009.1159[3]
real_world_msgs_test_v3.jsonsonnet-4-5raw_only11.00008.4864[6]
real_world_msgs_test_v3.jsonsonnet-4-5zero_shot11.00005.5904[0]
real_world_msgs_test_v3.jsonsonnet-4-6db_only11.00006.9338[3]
real_world_msgs_test_v3.jsonsonnet-4-6db_plus_raw11.00008.4382[3]
real_world_msgs_test_v3.jsonsonnet-4-6raw_only11.00007.1819[3]
real_world_msgs_test_v3.jsonsonnet-4-6zero_shot11.00006.2591[4]
single_product_multiple_shipment_complex.jsonopus-4-5db_only11.000010.8782[4]
single_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw11.00008.9548[5]
single_product_multiple_shipment_complex.jsonopus-4-5raw_only11.000027.7049[5]
single_product_multiple_shipment_complex.jsonopus-4-5zero_shot11.00009.9238[0]
single_product_multiple_shipment_complex.jsonopus-4-6db_only11.00008.8681[1]
single_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw11.000010.3277[4]
single_product_multiple_shipment_complex.jsonopus-4-6raw_only11.00008.6917[3]
single_product_multiple_shipment_complex.jsonopus-4-6zero_shot11.00007.1207[0]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_only11.000010.3388[4]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw11.000012.2838[4]
single_product_multiple_shipment_complex.jsonsonnet-4-5raw_only11.00009.9719[6]
single_product_multiple_shipment_complex.jsonsonnet-4-5zero_shot11.00007.4448[1]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_only11.00008.8977[4]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw11.000011.9766[4]
single_product_multiple_shipment_complex.jsonsonnet-4-6raw_only11.00009.6924[4]
single_product_multiple_shipment_complex.jsonsonnet-4-6zero_shot11.00007.5174[0]
single_product_multiple_shipment_medium.jsonopus-4-5db_only11.00009.0966[3]
single_product_multiple_shipment_medium.jsonopus-4-5db_plus_raw11.00008.5394[3]
single_product_multiple_shipment_medium.jsonopus-4-5raw_only11.000022.3543[3]
single_product_multiple_shipment_medium.jsonopus-4-5zero_shot11.00009.1793[1]
single_product_multiple_shipment_medium.jsonopus-4-6db_only11.00008.4056[2]
single_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw11.000010.3520[3]
single_product_multiple_shipment_medium.jsonopus-4-6raw_only11.00006.9889[3]
single_product_multiple_shipment_medium.jsonopus-4-6zero_shot11.00006.0001[0]
single_product_multiple_shipment_medium.jsonsonnet-4-5db_only11.00009.4677[3]
single_product_multiple_shipment_medium.jsonsonnet-4-5db_plus_raw11.00007.8498[3]
single_product_multiple_shipment_medium.jsonsonnet-4-5raw_only11.00007.2117[5]
single_product_multiple_shipment_medium.jsonsonnet-4-5zero_shot11.00006.6741[1]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_only11.00006.6728[3]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw11.00008.3305[3]
single_product_multiple_shipment_medium.jsonsonnet-4-6raw_only11.00006.6118[3]
single_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot11.00007.4008[4]
single_product_multiple_shipment_simple.jsonopus-4-5db_only11.00009.0824[3]
single_product_multiple_shipment_simple.jsonopus-4-5db_plus_raw11.00007.5320[3]
single_product_multiple_shipment_simple.jsonopus-4-5raw_only11.000028.1662[4]
single_product_multiple_shipment_simple.jsonopus-4-5zero_shot11.00007.4948[4]
single_product_multiple_shipment_simple.jsonopus-4-6db_only11.00008.3154[13]
single_product_multiple_shipment_simple.jsonopus-4-6db_plus_raw11.000010.2154[3]
single_product_multiple_shipment_simple.jsonopus-4-6raw_only11.00006.8777[3]
single_product_multiple_shipment_simple.jsonopus-4-6zero_shot11.00005.9368[1]
single_product_multiple_shipment_simple.jsonsonnet-4-5db_only11.00008.0143[3]
single_product_multiple_shipment_simple.jsonsonnet-4-5db_plus_raw11.00008.5885[3]
single_product_multiple_shipment_simple.jsonsonnet-4-5raw_only11.00006.7301[3]
single_product_multiple_shipment_simple.jsonsonnet-4-5zero_shot11.00005.9569[1]
single_product_multiple_shipment_simple.jsonsonnet-4-6db_only11.00007.0443[3]
single_product_multiple_shipment_simple.jsonsonnet-4-6db_plus_raw11.000010.1632[3]
single_product_multiple_shipment_simple.jsonsonnet-4-6raw_only11.00007.6634[3]
single_product_multiple_shipment_simple.jsonsonnet-4-6zero_shot11.00005.6089[0]
single_product_single_shipment_complex.jsonopus-4-5db_only11.00008.2430[4]
single_product_single_shipment_complex.jsonopus-4-5db_plus_raw11.00006.4775[4]
single_product_single_shipment_complex.jsonopus-4-5raw_only11.000020.3950[5]
single_product_single_shipment_complex.jsonopus-4-5zero_shot11.00006.9078[4]
single_product_single_shipment_complex.jsonopus-4-6db_only11.00006.7621[5]
single_product_single_shipment_complex.jsonopus-4-6db_plus_raw11.00007.6525[4]
single_product_single_shipment_complex.jsonopus-4-6raw_only11.00005.6598[4]
single_product_single_shipment_complex.jsonopus-4-6zero_shot11.00005.1428[4]
single_product_single_shipment_complex.jsonsonnet-4-5db_only11.00006.4033[6]
single_product_single_shipment_complex.jsonsonnet-4-5db_plus_raw11.00006.5115[6]
single_product_single_shipment_complex.jsonsonnet-4-5raw_only11.00005.6168[8]
single_product_single_shipment_complex.jsonsonnet-4-5zero_shot11.00005.7477[6]
single_product_single_shipment_complex.jsonsonnet-4-6db_only11.00006.6317[6]
single_product_single_shipment_complex.jsonsonnet-4-6db_plus_raw11.00007.1440[6]
single_product_single_shipment_complex.jsonsonnet-4-6raw_only11.00005.9534[6]
single_product_single_shipment_complex.jsonsonnet-4-6zero_shot11.00007.5932[4]
single_product_single_shipment_medium.jsonopus-4-5db_only11.00008.6304[3]
single_product_single_shipment_medium.jsonopus-4-5db_plus_raw11.00006.2610[3]
single_product_single_shipment_medium.jsonopus-4-5raw_only11.000019.5976[2]
single_product_single_shipment_medium.jsonopus-4-5zero_shot11.00004.9974[1]
single_product_single_shipment_medium.jsonopus-4-6db_only11.00007.8182[4]
single_product_single_shipment_medium.jsonopus-4-6db_plus_raw11.00007.0910[3]
single_product_single_shipment_medium.jsonopus-4-6raw_only11.00005.0971[3]
single_product_single_shipment_medium.jsonopus-4-6zero_shot11.00005.2821[1]
single_product_single_shipment_medium.jsonsonnet-4-5db_only11.00006.6754[3]
single_product_single_shipment_medium.jsonsonnet-4-5db_plus_raw11.00006.8331[3]
single_product_single_shipment_medium.jsonsonnet-4-5raw_only11.00005.0267[2]
single_product_single_shipment_medium.jsonsonnet-4-5zero_shot11.00005.3599[4]
single_product_single_shipment_medium.jsonsonnet-4-6db_only11.00006.2800[3]
single_product_single_shipment_medium.jsonsonnet-4-6db_plus_raw11.00009.1710[3]
single_product_single_shipment_medium.jsonsonnet-4-6raw_only11.00005.2559[3]
single_product_single_shipment_medium.jsonsonnet-4-6zero_shot11.00004.6565[3]
single_product_single_shipment_simple.jsonopus-4-5db_only11.00008.2063[0]
single_product_single_shipment_simple.jsonopus-4-5db_plus_raw11.00006.4471[0]
single_product_single_shipment_simple.jsonopus-4-5raw_only11.000018.5153[0]
single_product_single_shipment_simple.jsonopus-4-5zero_shot11.00005.5874[0]
single_product_single_shipment_simple.jsonopus-4-6db_only11.00006.3977[0]
single_product_single_shipment_simple.jsonopus-4-6db_plus_raw11.00007.2009[0]
single_product_single_shipment_simple.jsonopus-4-6raw_only11.00004.7336[0]
single_product_single_shipment_simple.jsonopus-4-6zero_shot11.00004.6261[0]
single_product_single_shipment_simple.jsonsonnet-4-5db_only11.00006.4154[0]
single_product_single_shipment_simple.jsonsonnet-4-5db_plus_raw11.00006.1572[0]
single_product_single_shipment_simple.jsonsonnet-4-5raw_only11.00004.5352[0]
single_product_single_shipment_simple.jsonsonnet-4-5zero_shot11.00004.9849[3]
single_product_single_shipment_simple.jsonsonnet-4-6db_only11.00005.8431[15]
single_product_single_shipment_simple.jsonsonnet-4-6db_plus_raw11.00008.0557[0]
single_product_single_shipment_simple.jsonsonnet-4-6raw_only11.00004.7110[0]
single_product_single_shipment_simple.jsonsonnet-4-6zero_shot11.00004.8118[0]

Top Mismatches (up to 100 runs)

ChatModelStrategyRunMismatch countSample mismatches
multiple_product_multiple_shipment_complex.jsonsonnet-4-5zero_shot121
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 300.0,
    "actual": 276.0
  },
  {
    "path": "data[0].items[1].quantity_unit",
    "expected": "boxes",
    "actual": "BOXES"
  },
  {
    "path": "data[0].items[1].unit_price",
    "expected": 12.0,
    "actual": 11.04
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_only120
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 2
  },
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "lecithin fat powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 8.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 1410.0,
    "actual": 12.0
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_only120
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 2
  },
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "lecithin fat powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 8.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 1410.0,
    "actual": 12.0
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5zero_shot119
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_plus_raw119
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 2
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "lecithin fat powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 8.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": 12.0
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6zero_shot118
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3.25,
    "actual": 3250.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/KG",
    "actual": "USD/MT"
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6raw_only118
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5zero_shot117
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_plus_raw117
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6zero_shot117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6raw_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_plus_raw117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5raw_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6raw_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5raw_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
07__2025-12-23__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_plus_raw117
[
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": ""
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10500.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3100.0,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": ""
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_plus_raw117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6db_only117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5zero_shot117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5db_plus_raw117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10500.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "KG"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5db_only117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6raw_only117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10500.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "KG"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_plus_raw117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5zero_shot117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5raw_only117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_plus_raw117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-5db_only117
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10.5
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_only116
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_plus_raw116
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5zero_shot116
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-6zero_shot116
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 2
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 6.3
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonsonnet-4-5raw_only116
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 3
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 10500.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "KG"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6zero_shot116
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 2
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 6.3
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
03__2026-01-30__120363403074656566_g_us__8f477a8f-2a60-4e0a-bf0e-8cc3cdf1dc9f.jsonopus-4-6db_only116
[
  {
    "path": "data",
    "expected_len": 1,
    "actual_len": 2
  },
  {
    "path": "data[0].items[0].description",
    "expected": "BergaPur",
    "actual": "Bergapur"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 6300.0,
    "actual": 6.3
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3050.0,
    "actual": 3.05
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6raw_only116
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
single_product_single_shipment_simple.jsonsonnet-4-6db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 5.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "BAGS",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 25.0,
    "actual": 1410.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/BAG",
    "actual": "USD/MT"
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
09__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 23000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonsonnet-4-5db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6raw_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6raw_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5raw_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-5zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "Soya Lecithin Powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 39000.0,
    "actual": 39.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Nhava Sheva",
    "actual": "CIF"
  }
]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6raw_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "Soya Lecithin Powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 39000.0,
    "actual": 39.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Nhava Sheva",
    "actual": "CIF"
  }
]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "Soya Lecithin Powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 39000.0,
    "actual": 39.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Nhava Sheva",
    "actual": "CIF"
  }
]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "Soya Lecithin Powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 39000.0,
    "actual": 39.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Nhava Sheva",
    "actual": "CIF"
  }
]
02__2026-02-09__120363426578757754_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "Soya Lecithin Powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 39000.0,
    "actual": 39.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Nhava Sheva",
    "actual": "CIF"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "EXW"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5zero_shot115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5raw_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_plus_raw115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
01__2026-02-24__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_only115
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3250.0,
    "actual": 3.25
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
08__2025-09-29__120363403592950429_g_us__d586d853-694c-42f9-93be-bc7ba5b2110c.jsonopus-4-5zero_shot114
[
  {
    "path": "data[0].items[0].description",
    "expected": "TG - BP102",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 46000.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/MT"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Busan"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-6db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5zero_shot114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonsonnet-4-5db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6zero_shot114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-6db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5zero_shot114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5raw_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
06__2026-01-06__120363421131250401_g_us__e05574ec-b110-4554-9fc3-3abb4f9011a8.jsonopus-4-5db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 1800.0,
    "actual": 1.8
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "kg",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 3500.0,
    "actual": 3.5
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "usd/mt",
    "actual": "USD/KG"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6zero_shot114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-6db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonsonnet-4-5db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-6db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5zero_shot114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
05__2026-01-20__120363407382355715_g_us__12a4f3a7-d506-4d32-ae06-3f76508c6abd.jsonopus-4-5db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOIFNE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 26000.0,
    "actual": 26.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF NHAVA SHEVA",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Nhava Sheva"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-6db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonsonnet-4-5db_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6raw_only114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]
04__2026-01-29__120363408498669191_g_us__4b9c2faa-94dd-4236-abcc-398807051f21.jsonopus-4-6db_plus_raw114
[
  {
    "path": "data[0].items[0].description",
    "expected": "GIIOFINE - P - S",
    "actual": "GIIOFINE-P-S"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 9000.0,
    "actual": 9.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "KG",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Jakarta",
    "actual": "CIF"
  },
  {
    "path": "data[0].items[0].delivery_terms",
    "expected": "",
    "actual": "CIF Jakarta"
  }
]