SYNTH-GPT2-MYOPIC-L_conv-10_shift-0_lr-0.0001_n_embd-128_n_head-2_n_layer-3_activation_function-relu_global_step=7815.0_val_loss=1.18.ckpt