{"n_layer": 24, "n_head": 16, "n_embd": 1024, "block_size": 1024, "bias": false, "input_vocab_size": 129600, "output_vocab_size": 10048, "dropout": 0.0} |
{"n_layer": 24, "n_head": 16, "n_embd": 1024, "block_size": 1024, "bias": false, "input_vocab_size": 129600, "output_vocab_size": 10048, "dropout": 0.0} |