File size: 1,595 Bytes
cefa210
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
{
    "os": "Linux-5.4.0-1043-gcp-x86_64-with-glibc2.29",
    "python": "3.8.10",
    "heartbeatAt": "2021-07-26T00:12:35.406409",
    "startedAt": "2021-07-26T00:12:33.305928",
    "docker": null,
    "cpu_count": 96,
    "cuda": null,
    "args": [
        "--model_name_or_path=bertin-project/bertin-base-stepwise",
        "--output_dir=./outputs",
        "--model_type=roberta",
        "--config_name=./configs/base",
        "--tokenizer_name=./configs/base",
        "--dataset_name=bertin-project/mc4-es-sampled",
        "--dataset_config_name=stepwise",
        "--max_seq_length=512",
        "--pad_to_max_length",
        "--per_device_train_batch_size=48",
        "--per_device_eval_batch_size=48",
        "--adam_beta1=0.9",
        "--adam_beta2=0.98",
        "--adam_epsilon=1e-6",
        "--learning_rate=6e-4",
        "--weight_decay=0.01",
        "--save_steps=1000",
        "--save_total_limit=5",
        "--warmup_steps=500",
        "--overwrite_output_dir",
        "--num_train_steps=50000",
        "--eval_steps=1000",
        "--dtype=bfloat16",
        "--logging_steps=500"
    ],
    "state": "running",
    "program": "./run_mlm_flax_stream.py",
    "codePath": "run_mlm_flax_stream.py",
    "git": {
        "remote": "https://huggingface.co/bertin-project/bertin-base-stepwise-exp-512seqlen",
        "commit": "529e26d977dcd80df13f8ff4dc528756c974c3b3"
    },
    "email": "[email protected]",
    "root": "/var/hf/experiment-base-exp-512seq-stepwise",
    "host": "tablespoon",
    "username": "versae",
    "executable": "/var/hf/venv/bin/python"
}