{
  "model_type": "tinygpt-minimal",
  "vocab_size": 8192,
  "context_length": 512,
  "dim": 512,
  "n_layers": 6,
  "n_heads": 8,
  "mlp_ratio": 4.0,
  "resid_dropout": 0.1,
  "attn_dropout": 0.0,
  "tie_embeddings": true
}