versae's picture
Step... (1000/50000 | Loss: 1.7686773538589478, Acc: 0.6487793326377869): 3%|▊ | 1286/50000 [29:40<20:20:20, 1.50s/it]
cefa210
raw
history blame
1.6 kB
{
"os": "Linux-5.4.0-1043-gcp-x86_64-with-glibc2.29",
"python": "3.8.10",
"heartbeatAt": "2021-07-26T00:12:35.406409",
"startedAt": "2021-07-26T00:12:33.305928",
"docker": null,
"cpu_count": 96,
"cuda": null,
"args": [
"--model_name_or_path=bertin-project/bertin-base-stepwise",
"--output_dir=./outputs",
"--model_type=roberta",
"--config_name=./configs/base",
"--tokenizer_name=./configs/base",
"--dataset_name=bertin-project/mc4-es-sampled",
"--dataset_config_name=stepwise",
"--max_seq_length=512",
"--pad_to_max_length",
"--per_device_train_batch_size=48",
"--per_device_eval_batch_size=48",
"--adam_beta1=0.9",
"--adam_beta2=0.98",
"--adam_epsilon=1e-6",
"--learning_rate=6e-4",
"--weight_decay=0.01",
"--save_steps=1000",
"--save_total_limit=5",
"--warmup_steps=500",
"--overwrite_output_dir",
"--num_train_steps=50000",
"--eval_steps=1000",
"--dtype=bfloat16",
"--logging_steps=500"
],
"state": "running",
"program": "./run_mlm_flax_stream.py",
"codePath": "run_mlm_flax_stream.py",
"git": {
"remote": "https://huggingface.co/bertin-project/bertin-base-stepwise-exp-512seqlen",
"commit": "529e26d977dcd80df13f8ff4dc528756c974c3b3"
},
"email": "[email protected]",
"root": "/var/hf/experiment-base-exp-512seq-stepwise",
"host": "tablespoon",
"username": "versae",
"executable": "/var/hf/venv/bin/python"
}