GPT2-NECK-SWEEP_20240120-002841-FA105_dataset_name-msmarco_hidden_idxs-12_hidden_lb-0_neck_cls-lstm_pretrained-0_token_lb-0_epoch=01-val_self_loss=10.68.ckpt