{
  "vocab": 32768,
  "d": 1024,
  "layers": 12,
  "heads": 16,
  "seq": 2048,
  "ff": 4,
  "arch": "SelectionCoder",
  "stage": "ideal-sft",
  "step": 3000
}
{
  "vocab": 32768,
  "d": 1024,
  "layers": 12,
  "heads": 16,
  "seq": 2048,
  "ff": 4,
  "arch": "SelectionCoder",
  "stage": "ideal-sft",
  "step": 3000
}