summaryrefslogtreecommitdiff
path: root/data/tokenizer_specs.json
blob: d7ad1ca0571ef43acaba3695af44f12deee43fc2 (plain)
1
2
3
4
5
6
7
8
9
{
  "tokenizers": [
    {
      "name": "sp_bpe_1024",
      "dataset_suffix": "sp1024",
      "vocab_size": 1024
    }
  ]
}