GPT2-NECK-SWEEP_20240119-135624-D1b52_dataset_name-msmarco_hidden_idxs-11_hidden_lb-0_neck_cls-mlp_pretrained-1_token_lb-0_epoch=03-val_self_loss=5.08.ckpt