GPT2-NECK-SWEEP_20240119-183427-53E8C_dataset_name-msmarco_hidden_idxs-11_hidden_lb-0_neck_cls-lstm_pretrained-1_token_lb-0_epoch=02-val_self_loss=4.32.ckpt