Few-shot Benchmark Report

Run ID: 20260505T180307Z | Generated UTC: 2026-05-05T18:07:21.150598+00:00

Configuration

{
  "models": [
    "opus-4-5",
    "opus-4-6",
    "sonnet-4-5",
    "sonnet-4-6"
  ],
  "fewshot_strategies": [
    "db_only",
    "db_plus_raw",
    "raw_only",
    "zero_shot"
  ],
  "chat_count": 12,
  "runs_per_chat": 2,
  "max_workers": 15,
  "raw_fewshot_count": 26,
  "raw_fewshot_labels_filter": []
}

Model + Strategy Summary

Model | Strategy | Runs | Success rate | Avg attempts | Avg elapsed (s) | Avg mismatch/expected run | Field match rate
opus-4-5 | db_only | 24 | 1.0000 | 1.0000 | 9.0073 | 15.4583 | 0.5726
opus-4-5 | db_plus_raw | 24 | 1.0000 | 1.0000 | 12.7979 | 15.0833 | 0.5829
opus-4-5 | raw_only | 24 | 1.0000 | 1.0000 | 21.7177 | 14.2083 | 0.6071
opus-4-5 | zero_shot | 24 | 1.0000 | 1.0000 | 6.5281 | 12.9167 | 0.5216
opus-4-6 | db_only | 24 | 1.0000 | 1.0000 | 8.4391 | 16.4167 | 0.4903
opus-4-6 | db_plus_raw | 24 | 1.0000 | 1.0000 | 19.8156 | 15.2500 | 0.5783
opus-4-6 | raw_only | 24 | 1.0000 | 1.0000 | 7.2128 | 15.5000 | 0.5714
opus-4-6 | zero_shot | 24 | 1.0000 | 1.0000 | 6.0742 | 9.7917 | 0.5165
sonnet-4-5 | db_only | 24 | 1.0000 | 1.0000 | 8.6587 | 15.0000 | 0.5663
sonnet-4-5 | db_plus_raw | 24 | 1.0000 | 1.0000 | 9.0419 | 15.7500 | 0.5645
sonnet-4-5 | raw_only | 24 | 1.0000 | 1.0000 | 7.8363 | 15.8750 | 0.5611
sonnet-4-5 | zero_shot | 24 | 1.0000 | 1.0000 | 6.7775 | 11.9583 | 0.5176
sonnet-4-6 | db_only | 24 | 1.0000 | 1.0000 | 7.7667 | 16.0417 | 0.5565
sonnet-4-6 | db_plus_raw | 24 | 1.0000 | 1.0000 | 9.0471 | 14.9583 | 0.5864
sonnet-4-6 | raw_only | 24 | 1.0000 | 1.0000 | 7.1928 | 15.2917 | 0.5772
sonnet-4-6 | zero_shot | 24 | 1.0000 | 1.0000 | 6.7891 | 13.0417 | 0.5437

Per-chat Breakdown

Chat | Model | Strategy | Runs | Success rate | Avg elapsed (s) | Mismatch counts
multiple_product_multiple_shipment_complex.jsonopus-4-5db_only21.000013.4062[41, 41]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw21.000011.9343[43, 41]
multiple_product_multiple_shipment_complex.jsonopus-4-5raw_only21.000024.5134[40, 40]
multiple_product_multiple_shipment_complex.jsonopus-4-5zero_shot21.000011.8529[41, 41]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_only21.000013.1892[47, 47]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw21.000013.3903[38, 38]
multiple_product_multiple_shipment_complex.jsonopus-4-6raw_only21.000012.0736[40, 40]
multiple_product_multiple_shipment_complex.jsonopus-4-6zero_shot21.00009.3648[10, 10]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_only21.000012.6261[38, 40]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw21.000014.4224[41, 41]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5raw_only21.000012.8820[38, 41]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5zero_shot21.000011.1218[11, 30]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_only21.000010.3423[38, 38]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw21.000012.0421[38, 33]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6raw_only21.000011.2341[37, 37]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6zero_shot21.000010.5679[31, 31]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_only21.000010.4988[24, 24]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_plus_raw21.00009.7952[22, 22]
multiple_product_multiple_shipment_medium.jsonopus-4-5raw_only21.000023.0609[19, 22]
multiple_product_multiple_shipment_medium.jsonopus-4-5zero_shot21.00007.9537[24, 24]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_only21.000010.2524[24, 24]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw21.00009.9708[24, 24]
multiple_product_multiple_shipment_medium.jsonopus-4-6raw_only21.00008.2871[22, 22]
multiple_product_multiple_shipment_medium.jsonopus-4-6zero_shot21.00006.7422[11, 11]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_only21.00009.5209[24, 24]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_plus_raw21.000011.0477[20, 24]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5raw_only21.00008.5159[22, 22]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5zero_shot21.00007.8221[24, 26]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_only21.00008.5846[24, 24]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw21.000010.5435[24, 24]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6raw_only21.00007.7728[22, 22]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot21.00007.6468[25, 22]
multiple_product_multiple_shipment_simple.jsonopus-4-5db_only21.00009.5594[16, 16]
multiple_product_multiple_shipment_simple.jsonopus-4-5db_plus_raw21.00008.3421[16, 16]
multiple_product_multiple_shipment_simple.jsonopus-4-5raw_only21.000020.3248[14, 14]
multiple_product_multiple_shipment_simple.jsonopus-4-5zero_shot21.00005.9148[12, 12]
multiple_product_multiple_shipment_simple.jsonopus-4-6db_only21.00008.0840[12, 27]
multiple_product_multiple_shipment_simple.jsonopus-4-6db_plus_raw21.000018.7685[16, 18]
multiple_product_multiple_shipment_simple.jsonopus-4-6raw_only21.00007.0049[18, 18]
multiple_product_multiple_shipment_simple.jsonopus-4-6zero_shot21.00005.8224[13, 13]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5db_only21.00007.2254[10, 10]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5db_plus_raw21.00009.0899[16, 16]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5raw_only21.00008.1257[18, 16]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5zero_shot21.00006.1588[13, 13]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6db_only21.00006.9738[16, 16]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6db_plus_raw21.00008.4032[16, 16]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6raw_only21.00007.0220[17, 16]
multiple_product_multiple_shipment_simple.jsonsonnet-4-6zero_shot21.00005.8578[12, 12]
real_world_msgs_test_v1.jsonopus-4-5db_only21.00009.1291[11, 8]
real_world_msgs_test_v1.jsonopus-4-5db_plus_raw21.00007.1828[8, 8]
real_world_msgs_test_v1.jsonopus-4-5raw_only21.000017.3862[8, 8]
real_world_msgs_test_v1.jsonopus-4-5zero_shot21.00005.0774[8, 8]
real_world_msgs_test_v1.jsonopus-4-6db_only21.00006.8878[8, 8]
real_world_msgs_test_v1.jsonopus-4-6db_plus_raw21.000029.3460[8, 8]
real_world_msgs_test_v1.jsonopus-4-6raw_only21.00005.9718[8, 8]
real_world_msgs_test_v1.jsonopus-4-6zero_shot21.00005.2084[10, 10]
real_world_msgs_test_v1.jsonsonnet-4-5db_only21.00008.6640[11, 11]
real_world_msgs_test_v1.jsonsonnet-4-5db_plus_raw21.00008.7967[11, 11]
real_world_msgs_test_v1.jsonsonnet-4-5raw_only21.00007.3437[12, 12]
real_world_msgs_test_v1.jsonsonnet-4-5zero_shot21.00006.2823[11, 11]
real_world_msgs_test_v1.jsonsonnet-4-6db_only21.00006.9921[8, 8]
real_world_msgs_test_v1.jsonsonnet-4-6db_plus_raw21.00006.7997[8, 8]
real_world_msgs_test_v1.jsonsonnet-4-6raw_only21.00005.3427[9, 9]
real_world_msgs_test_v1.jsonsonnet-4-6zero_shot21.00005.1170[10, 10]
real_world_msgs_test_v2.jsonopus-4-5db_only21.00008.6968[13, 13]
real_world_msgs_test_v2.jsonopus-4-5db_plus_raw21.00007.6117[13, 13]
real_world_msgs_test_v2.jsonopus-4-5raw_only21.000029.3183[13, 13]
real_world_msgs_test_v2.jsonopus-4-5zero_shot21.00007.2797[13, 13]
real_world_msgs_test_v2.jsonopus-4-6db_only21.00008.0128[13, 13]
real_world_msgs_test_v2.jsonopus-4-6db_plus_raw21.000026.2668[13, 13]
real_world_msgs_test_v2.jsonopus-4-6raw_only21.00007.4627[13, 13]
real_world_msgs_test_v2.jsonopus-4-6zero_shot21.00006.4021[13, 14]
real_world_msgs_test_v2.jsonsonnet-4-5db_only21.00008.3810[13, 13]
real_world_msgs_test_v2.jsonsonnet-4-5db_plus_raw21.00009.2966[13, 13]
real_world_msgs_test_v2.jsonsonnet-4-5raw_only21.00007.5710[17, 17]
real_world_msgs_test_v2.jsonsonnet-4-5zero_shot21.00006.7523[13, 13]
real_world_msgs_test_v2.jsonsonnet-4-6db_only21.00006.9755[13, 13]
real_world_msgs_test_v2.jsonsonnet-4-6db_plus_raw21.00007.6709[13, 13]
real_world_msgs_test_v2.jsonsonnet-4-6raw_only21.00007.2782[16, 16]
real_world_msgs_test_v2.jsonsonnet-4-6zero_shot21.00008.1861[14, 14]
real_world_msgs_test_v3.jsonopus-4-5db_only21.00008.9480[13, 13]
real_world_msgs_test_v3.jsonopus-4-5db_plus_raw21.00007.3866[13, 13]
real_world_msgs_test_v3.jsonopus-4-5raw_only21.000024.0110[13, 13]
real_world_msgs_test_v3.jsonopus-4-5zero_shot21.00005.9911[9, 9]
real_world_msgs_test_v3.jsonopus-4-6db_only21.00008.1748[13, 13]
real_world_msgs_test_v3.jsonopus-4-6db_plus_raw21.000029.0950[13, 13]
real_world_msgs_test_v3.jsonopus-4-6raw_only21.00007.0847[13, 13]
real_world_msgs_test_v3.jsonopus-4-6zero_shot21.00006.0732[9, 9]
real_world_msgs_test_v3.jsonsonnet-4-5db_only21.00008.4088[13, 13]
real_world_msgs_test_v3.jsonsonnet-4-5db_plus_raw21.00008.3666[17, 17]
real_world_msgs_test_v3.jsonsonnet-4-5raw_only21.00007.5119[17, 17]
real_world_msgs_test_v3.jsonsonnet-4-5zero_shot21.00007.1396[9, 9]
real_world_msgs_test_v3.jsonsonnet-4-6db_only21.00006.7129[13, 13]
real_world_msgs_test_v3.jsonsonnet-4-6db_plus_raw21.00008.7110[13, 13]
real_world_msgs_test_v3.jsonsonnet-4-6raw_only21.00006.9232[13, 13]
real_world_msgs_test_v3.jsonsonnet-4-6zero_shot21.00005.7824[11, 11]
single_product_multiple_shipment_complex.jsonopus-4-5db_only21.000010.6272[22, 22]
single_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw21.00009.1463[22, 22]
single_product_multiple_shipment_complex.jsonopus-4-5raw_only21.000027.7767[19, 19]
single_product_multiple_shipment_complex.jsonopus-4-5zero_shot21.00007.0074[11, 11]
single_product_multiple_shipment_complex.jsonopus-4-6db_only21.00008.8402[12, 12]
single_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw21.000028.5284[22, 22]
single_product_multiple_shipment_complex.jsonopus-4-6raw_only21.00008.8787[25, 25]
single_product_multiple_shipment_complex.jsonopus-4-6zero_shot21.00007.1064[11, 11]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_only21.000010.6799[22, 22]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw21.000010.7180[21, 21]
single_product_multiple_shipment_complex.jsonsonnet-4-5raw_only21.000010.0674[19, 19]
single_product_multiple_shipment_complex.jsonsonnet-4-5zero_shot21.00007.6867[11, 11]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_only21.000010.7506[22, 22]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw21.000011.4762[22, 22]
single_product_multiple_shipment_complex.jsonsonnet-4-6raw_only21.000011.2134[22, 22]
single_product_multiple_shipment_complex.jsonsonnet-4-6zero_shot21.00008.2816[11, 11]
single_product_multiple_shipment_medium.jsonopus-4-5db_only21.00009.2031[17, 17]
single_product_multiple_shipment_medium.jsonopus-4-5db_plus_raw21.00008.3981[17, 17]
single_product_multiple_shipment_medium.jsonopus-4-5raw_only21.000020.5861[17, 17]
single_product_multiple_shipment_medium.jsonopus-4-5zero_shot21.00006.0220[12, 12]
single_product_multiple_shipment_medium.jsonopus-4-6db_only21.00008.7698[19, 19]
single_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw21.000027.0612[17, 19]
single_product_multiple_shipment_medium.jsonopus-4-6raw_only21.00007.5534[17, 17]
single_product_multiple_shipment_medium.jsonopus-4-6zero_shot21.00006.0306[12, 12]
single_product_multiple_shipment_medium.jsonsonnet-4-5db_only21.00009.0231[17, 17]
single_product_multiple_shipment_medium.jsonsonnet-4-5db_plus_raw21.00008.1665[17, 17]
single_product_multiple_shipment_medium.jsonsonnet-4-5raw_only21.00007.7417[17, 17]
single_product_multiple_shipment_medium.jsonsonnet-4-5zero_shot21.00006.4371[12, 12]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_only21.00007.6027[17, 17]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw21.000013.3270[17, 17]
single_product_multiple_shipment_medium.jsonsonnet-4-6raw_only21.00007.0010[17, 17]
single_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot21.00006.9483[19, 19]
single_product_multiple_shipment_simple.jsonopus-4-5db_only21.00007.2896[14, 14]
single_product_multiple_shipment_simple.jsonopus-4-5db_plus_raw21.000020.9075[13, 12]
single_product_multiple_shipment_simple.jsonopus-4-5raw_only21.000019.7298[12, 12]
single_product_multiple_shipment_simple.jsonopus-4-5zero_shot21.00006.0084[10, 9]
single_product_multiple_shipment_simple.jsonopus-4-6db_only21.00008.4985[23, 23]
single_product_multiple_shipment_simple.jsonopus-4-6db_plus_raw21.000023.0870[14, 14]
single_product_multiple_shipment_simple.jsonopus-4-6raw_only21.00006.6646[14, 14]
single_product_multiple_shipment_simple.jsonopus-4-6zero_shot21.00005.6699[10, 10]
single_product_multiple_shipment_simple.jsonsonnet-4-5db_only21.00008.9361[14, 14]
single_product_multiple_shipment_simple.jsonsonnet-4-5db_plus_raw21.00008.1629[14, 14]
single_product_multiple_shipment_simple.jsonsonnet-4-5raw_only21.00007.4617[13, 13]
single_product_multiple_shipment_simple.jsonsonnet-4-5zero_shot21.00006.6643[10, 10]
single_product_multiple_shipment_simple.jsonsonnet-4-6db_only21.00006.9893[14, 14]
single_product_multiple_shipment_simple.jsonsonnet-4-6db_plus_raw21.00009.0193[14, 14]
single_product_multiple_shipment_simple.jsonsonnet-4-6raw_only21.00006.5538[14, 14]
single_product_multiple_shipment_simple.jsonsonnet-4-6zero_shot21.00005.9300[9, 9]
single_product_single_shipment_complex.jsonopus-4-5db_only21.00006.6842[4, 4]
single_product_single_shipment_complex.jsonopus-4-5db_plus_raw21.000021.8049[4, 4]
single_product_single_shipment_complex.jsonopus-4-5raw_only21.000021.0643[3, 3]
single_product_single_shipment_complex.jsonopus-4-5zero_shot21.00004.8121[3, 6]
single_product_single_shipment_complex.jsonopus-4-6db_only21.00007.2630[5, 5]
single_product_single_shipment_complex.jsonopus-4-6db_plus_raw21.000018.6269[4, 4]
single_product_single_shipment_complex.jsonopus-4-6raw_only21.00005.1209[4, 4]
single_product_single_shipment_complex.jsonopus-4-6zero_shot21.00004.7135[6, 6]
single_product_single_shipment_complex.jsonsonnet-4-5db_only21.00007.8461[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-5db_plus_raw21.00006.6891[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-5raw_only21.00006.0804[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-5zero_shot21.00005.3951[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-6db_only21.00006.6700[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-6db_plus_raw21.00007.2455[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-6raw_only21.00005.8954[5, 5]
single_product_single_shipment_complex.jsonsonnet-4-6zero_shot21.00007.9609[3, 5]
single_product_single_shipment_medium.jsonopus-4-5db_only21.00006.8616[5, 5]
single_product_single_shipment_medium.jsonopus-4-5db_plus_raw21.000018.8684[4, 5]
single_product_single_shipment_medium.jsonopus-4-5raw_only21.000027.9534[4, 4]
single_product_single_shipment_medium.jsonopus-4-5zero_shot21.00005.2085[4, 4]
single_product_single_shipment_medium.jsonopus-4-6db_only21.00006.8168[6, 7]
single_product_single_shipment_medium.jsonopus-4-6db_plus_raw21.00007.2542[5, 5]
single_product_single_shipment_medium.jsonopus-4-6raw_only21.00005.4114[5, 5]
single_product_single_shipment_medium.jsonopus-4-6zero_shot21.00004.9310[5, 5]
single_product_single_shipment_medium.jsonsonnet-4-5db_only21.00006.6914[5, 5]
single_product_single_shipment_medium.jsonsonnet-4-5db_plus_raw21.00007.3883[5, 5]
single_product_single_shipment_medium.jsonsonnet-4-5raw_only21.00005.8366[5, 5]
single_product_single_shipment_medium.jsonsonnet-4-5zero_shot21.00005.0717[6, 6]
single_product_single_shipment_medium.jsonsonnet-4-6db_only21.00007.6573[6, 5]
single_product_single_shipment_medium.jsonsonnet-4-6db_plus_raw21.00007.0603[5, 5]
single_product_single_shipment_medium.jsonsonnet-4-6raw_only21.00005.0431[5, 5]
single_product_single_shipment_medium.jsonsonnet-4-6zero_shot21.00004.5857[5, 5]
single_product_single_shipment_simple.jsonopus-4-5db_only21.00007.1831[7, 7]
single_product_single_shipment_simple.jsonopus-4-5db_plus_raw21.000022.1966[7, 7]
single_product_single_shipment_simple.jsonopus-4-5raw_only21.00004.8875[7, 7]
single_product_single_shipment_simple.jsonopus-4-5zero_shot21.00005.2086[7, 7]
single_product_single_shipment_simple.jsonopus-4-6db_only21.00006.4802[7, 7]
single_product_single_shipment_simple.jsonopus-4-6db_plus_raw21.00006.3922[7, 7]
single_product_single_shipment_simple.jsonopus-4-6raw_only21.00005.0399[7, 7]
single_product_single_shipment_simple.jsonopus-4-6zero_shot21.00004.8259[7, 7]
single_product_single_shipment_simple.jsonsonnet-4-5db_only21.00005.9010[7, 7]
single_product_single_shipment_simple.jsonsonnet-4-5db_plus_raw21.00006.3576[7, 7]
single_product_single_shipment_simple.jsonsonnet-4-5raw_only21.00004.8972[7, 7]
single_product_single_shipment_simple.jsonsonnet-4-5zero_shot21.00004.7984[8, 8]
single_product_single_shipment_simple.jsonsonnet-4-6db_only21.00006.9497[17, 17]
single_product_single_shipment_simple.jsonsonnet-4-6db_plus_raw21.00006.2664[7, 7]
single_product_single_shipment_simple.jsonsonnet-4-6raw_only21.00005.0337[7, 7]
single_product_single_shipment_simple.jsonsonnet-4-6zero_shot21.00004.6042[7, 7]

Top Mismatches (up to 100 runs)

Chat | Model | Strategy | Run | Mismatch count | Sample mismatches
multiple_product_multiple_shipment_complex.jsonopus-4-6db_only147
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_only247
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw243
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5raw_only241
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw141
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw241
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5zero_shot241
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5zero_shot141
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw141
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_only141
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5db_only241
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_only140
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-6raw_only140
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-6raw_only240
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5raw_only240
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-5raw_only140
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw138
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_only138
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_only238
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5raw_only138
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5db_only238
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw238
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw138
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6raw_only137
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6raw_only237
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw233
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6zero_shot131
[
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from first delivery",
      "Net 30",
      "2026-03-30"
    ],
    "actual": ""
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-6zero_shot231
[
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].total",
    "expected": 276.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from first delivery",
      "Net 30",
      "2026-03-30"
    ],
    "actual": ""
  }
]
multiple_product_multiple_shipment_complex.jsonsonnet-4-5zero_shot230
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.0,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
multiple_product_multiple_shipment_simple.jsonopus-4-6db_only227
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "lecithin fat powder"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 10.0,
    "actual": 8.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 25.0,
    "actual": 12.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/KG"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5zero_shot226
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": ""
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
single_product_multiple_shipment_complex.jsonopus-4-6raw_only125
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-6raw_only225
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot125
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAGS"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 3600.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_only224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6db_only124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5zero_shot124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_plus_raw224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_only124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_only224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_only124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-6db_only224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5zero_shot124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": null
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": ""
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5zero_shot224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_only224
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_only124
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
single_product_multiple_shipment_simple.jsonopus-4-6db_only123
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "lecithin fat powder"
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 25.0,
    "actual": 12.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/KG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 375.0,
    "actual": 96000.0
  }
]
single_product_multiple_shipment_simple.jsonopus-4-6db_only223
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "lecithin fat powder"
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 25.0,
    "actual": 12.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/KG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 375.0,
    "actual": 96000.0
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-6raw_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-6raw_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_plus_raw222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-6db_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-6db_plus_raw122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-5db_plus_raw122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-5db_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-5db_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6raw_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-6raw_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5raw_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5raw_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-6raw_only122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-6raw_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5raw_only222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_plus_raw122
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5db_plus_raw222
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].total",
    "expected": 285.0,
    "actual": 300.0
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw121
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-5db_plus_raw221
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].payment_date",
    "expected": [
      "Net 30 from last delivery",
      "Net 30",
      "2026-04-08"
    ],
    "actual": ""
  }
]
multiple_product_multiple_shipment_medium.jsonsonnet-4-5db_plus_raw120
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot219
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "KNM Coffee (medium roast)"
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6zero_shot119
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "KNM Coffee (medium roast)"
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  }
]
single_product_multiple_shipment_medium.jsonopus-4-6db_plus_raw219
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_medium.jsonopus-4-6db_only119
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_medium.jsonopus-4-6db_only219
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-5raw_only119
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].billing_address",
    "expected": [],
    "actual": "Leonardo da Vinci, da@vinci.com"
  }
]
single_product_multiple_shipment_complex.jsonsonnet-4-5raw_only219
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].billing_address",
    "expected": [],
    "actual": "Leonardo da Vinci, da@vinci.com"
  }
]
single_product_multiple_shipment_complex.jsonopus-4-5raw_only219
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].billing_address",
    "expected": [],
    "actual": ""
  }
]
single_product_multiple_shipment_complex.jsonopus-4-5raw_only119
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "FOB Singapore",
    "actual": "FOB"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  },
  {
    "path": "data[0].billing_address",
    "expected": [],
    "actual": ""
  }
]
multiple_product_multiple_shipment_medium.jsonopus-4-5raw_only119
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 23.75,
    "actual": 25.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "EXW Singapore",
    "actual": "EXW"
  },
  {
    "path": "data[0].vendor_name",
    "expected": "flamingos",
    "actual": "Van Beethoven"
  }
]
multiple_product_multiple_shipment_simple.jsonsonnet-4-5raw_only118
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2024-11-200",
    "actual": "PO-2025-11-200"
  }
]
multiple_product_multiple_shipment_simple.jsonopus-4-6raw_only118
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2024-11-200",
    "actual": "PO-2025-11-200"
  }
]
multiple_product_multiple_shipment_simple.jsonopus-4-6raw_only218
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2024-11-200",
    "actual": "PO-2025-11-200"
  }
]
multiple_product_multiple_shipment_simple.jsonopus-4-6db_plus_raw218
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2024-11-200",
    "actual": "PO-2025-11-200"
  }
]
single_product_single_shipment_simple.jsonsonnet-4-6db_only217
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 5.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 25.0,
    "actual": 1410.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/MT"
  }
]
single_product_single_shipment_simple.jsonsonnet-4-6db_only117
[
  {
    "path": "data[0].items[0].description",
    "expected": "KNM Coffee",
    "actual": "BP102"
  },
  {
    "path": "data[0].items[0].quantity",
    "expected": 5.0,
    "actual": 23.0
  },
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "MT"
  },
  {
    "path": "data[0].items[0].unit_price",
    "expected": 25.0,
    "actual": 1410.0
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/MT"
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6raw_only117
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6raw_only217
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw217
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_plus_raw117
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]
single_product_multiple_shipment_medium.jsonsonnet-4-6db_only117
[
  {
    "path": "data[0].items[0].quantity_unit",
    "expected": "bags",
    "actual": "BAGS"
  },
  {
    "path": "data[0].items[0].pricing_unit",
    "expected": "USD/bag",
    "actual": "USD/BAG"
  },
  {
    "path": "data[0].items[0].ship_term",
    "expected": "CIF Singapore",
    "actual": "CIF"
  },
  {
    "path": "data[0].do_date",
    "expected": "2026-04-30",
    "actual": "2026-05-31"
  },
  {
    "path": "data[0].po_ref_no",
    "expected": "PO-2025-11-180",
    "actual": ""
  }
]