kejian
/

mighty-conditional

@@ -36,9 +36,11 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 0.0008
-- train_batch_size: 64
-- eval_batch_size: 32
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_ratio: 0.01
@@ -60,7 +62,7 @@ The following hyperparameters were used during training:
                                              'threshold': 0},
              'datasets': ['kejian/codeparrot-train-more-filter-3.3b-cleaned'],
              'is_split_by_sentences': True},
- 'generation': {'batch_size': 64,
                 'metrics_configs': [{}, {'n': 1}, {}],
                 'scenario_configs': [{'display_as_html': True,
                                       'generate_kwargs': {'bad_words_ids': [[32769]],
@@ -73,7 +75,7 @@ The following hyperparameters were used during training:
                                                           'top_p': 0.9},
                                       'name': 'unconditional',
                                       'num_hits_threshold': 0,
-                                      'num_samples': 4096,
                                       'prefix': '<|aligned|>',
                                       'use_prompt_for_scoring': False},
                                      {'display_as_html': True,
@@ -87,7 +89,7 @@ The following hyperparameters were used during training:
                                                           'top_p': 0.9},
                                       'name': 'functions',
                                       'num_hits_threshold': 0,
-                                      'num_samples': 4096,
                                       'prefix': '<|aligned|>',
                                       'prompt_before_control': True,
                                       'prompts_path': 'resources/functions_csnet.jsonl',
@@ -127,4 +129,4 @@ The following hyperparameters were used during training:
               'weight_decay': 0.1}}
 # Wandb URL:
-https://wandb.ai/kejian/uncategorized/runs/h0khl32b

 The following hyperparameters were used during training:
 - learning_rate: 0.0008
+- train_batch_size: 32
+- eval_batch_size: 16
 - seed: 42
+- gradient_accumulation_steps: 2
+- total_train_batch_size: 64
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_ratio: 0.01
                                              'threshold': 0},
              'datasets': ['kejian/codeparrot-train-more-filter-3.3b-cleaned'],
              'is_split_by_sentences': True},
+ 'generation': {'batch_size': 128,
                 'metrics_configs': [{}, {'n': 1}, {}],
                 'scenario_configs': [{'display_as_html': True,
                                       'generate_kwargs': {'bad_words_ids': [[32769]],
                                                           'top_p': 0.9},
                                       'name': 'unconditional',
                                       'num_hits_threshold': 0,
+                                      'num_samples': 2048,
                                       'prefix': '<|aligned|>',
                                       'use_prompt_for_scoring': False},
                                      {'display_as_html': True,
                                                           'top_p': 0.9},
                                       'name': 'functions',
                                       'num_hits_threshold': 0,
+                                      'num_samples': 2048,
                                       'prefix': '<|aligned|>',
                                       'prompt_before_control': True,
                                       'prompts_path': 'resources/functions_csnet.jsonl',
               'weight_decay': 0.1}}
 # Wandb URL:
+https://wandb.ai/kejian/uncategorized/runs/zpigcpaa