{ "head_dim": 128, "metadata": { "dataset": "kmfoda/booksum", "model": "Qwen/Qwen3-8B", "n_future_positions": 500, "n_samples": 100, "n_sink": 4 }, "num_heads": 32, "num_layers": 36 }