{
  "comparison": {
    "elements": 12288,
    "lhs": "fused_turboquant_gemv",
    "max_abs": 0.0078125,
    "max_abs_index": 2877,
    "max_rel": 4.591836929321289,
    "max_rel_index": 5205,
    "mean_abs": 0.0005096865255230417,
    "mean_rel": 0.009938551390329545,
    "rhs": "bulk_dequant_cublas",
    "rhs_rms": 0.3884690580087436,
    "rmse": 0.0009784491757410957,
    "rmse_over_rhs_rms": 0.002518731300651165
  },
  "first8": [
    {
      "abs_err": 0.0,
      "bulk_dequant_cublas": -0.28515625,
      "fused_gemv": -0.28515625,
      "index": 0,
      "rel_err": 0.0
    },
    {
      "abs_err": 0.0009765625,
      "bulk_dequant_cublas": 0.1123046875,
      "fused_gemv": 0.11328125,
      "index": 1,
      "rel_err": 0.008695651777088642
    },
    {
      "abs_err": 0.001953125,
      "bulk_dequant_cublas": -0.208984375,
      "fused_gemv": -0.2109375,
      "index": 2,
      "rel_err": 0.009345794096589088
    },
    {
      "abs_err": 0.0006103515625,
      "bulk_dequant_cublas": -0.0262451171875,
      "fused_gemv": -0.025634765625,
      "index": 3,
      "rel_err": 0.023255813866853714
    },
    {
      "abs_err": 0.001953125,
      "bulk_dequant_cublas": -0.134765625,
      "fused_gemv": -0.13671875,
      "index": 4,
      "rel_err": 0.014492753893136978
    },
    {
      "abs_err": 0.0,
      "bulk_dequant_cublas": 0.5234375,
      "fused_gemv": 0.5234375,
      "index": 5,
      "rel_err": 0.0
    },
    {
      "abs_err": 0.001953125,
      "bulk_dequant_cublas": 0.267578125,
      "fused_gemv": 0.265625,
      "index": 6,
      "rel_err": 0.007299270015209913
    },
    {
      "abs_err": 0.00048828125,
      "bulk_dequant_cublas": -0.068359375,
      "fused_gemv": -0.06787109375,
      "index": 7,
      "rel_err": 0.0071428571827709675
    }
  ],
  "input": {
    "first8": [
      0.60546875,
      0.466796875,
      -0.35546875,
      -0.48828125,
      -0.984375,
      0.216796875,
      -0.12890625,
      -0.52734375
    ],
    "shape": [
      1,
      4096
    ]
  },
  "model_path": "/home/ckl/.cache/modelscope/hub/Qwen/Qwen3___5-9B-TQ4",
  "projection": {
    "bits": 4,
    "cols": 4096,
    "group_size": 128,
    "num_groups": 32,
    "packed_cols": 2048,
    "rows": 12288
  },
  "seed": 1592594996,
  "tensor_base": "model.language_model.layers.0.mlp.up_proj"
}
