blob: 07c58c39c2d9b468bbacc9fc7e44f3f139d9a5aa (
plain)
1
2
3
4
5
6
7
8
9
10
11
|
{
"author": "samuellarson",
"github_id": "samuellarson",
"name": "Int6 MLP3x Sliding Window",
"blurb": "Int6 post-training quantization enables 3x MLP expansion (21.8M params in 16MB). Combined with train@2048 + sliding window eval + FP16 tied embeddings + Late-K passthrough.",
"date": "2026-03-20",
"val_loss": 1.95428963,
"val_bpb": 1.15744040,
"bytes_total": 15977717,
"bytes_code": 51200
}
|