| { | |
| "architectures": [ | |
| "SimCSEModel" | |
| ], | |
| "base_model": "klue/roberta-base", | |
| "batch_size": 64, | |
| "dataset_dir": "/opt/ml/input/data/training/", | |
| "debug": "False", | |
| "device": "cuda:0", | |
| "eval_steps": 50, | |
| "local_rank": 0, | |
| "lr": 3e-05, | |
| "lr_scheduler_type": "linear", | |
| "max_seq_len": 64, | |
| "num_epochs": 1, | |
| "num_warmup_steps": 0, | |
| "output_dir": "/opt/ml/model/", | |
| "rank": 0, | |
| "save_path": "../model", | |
| "seed": 42, | |
| "temperature": 0.05, | |
| "torch_dtype": "float32", | |
| "transformers_version": "4.33.3", | |
| "use_fp16": "False", | |
| "version": 1.0, | |
| "world_size": 4 | |
| } | |