update model card README.md
Browse files
README.md
CHANGED
@@ -61,7 +61,7 @@ The following hyperparameters were used during training:
|
|
61 |
'skip_tokens': 1649934336},
|
62 |
'generation': {'batch_size': 128,
|
63 |
'every_n_steps': 256,
|
64 |
-
'force_call_on': [
|
65 |
'metrics_configs': [{}, {'n': 1}, {}],
|
66 |
'scenario_configs': [{'display_as_html': True,
|
67 |
'generate_kwargs': {'do_sample': True,
|
@@ -89,7 +89,7 @@ The following hyperparameters were used during training:
|
|
89 |
'use_prompt_for_scoring': True}],
|
90 |
'scorer_config': {}},
|
91 |
'kl_gpt3_callback': {'every_n_steps': 256,
|
92 |
-
'force_call_on': [
|
93 |
'gpt3_kwargs': {'model_name': 'code-cushman-001'},
|
94 |
'max_tokens': 64,
|
95 |
'num_samples': 4096},
|
@@ -115,7 +115,7 @@ The following hyperparameters were used during training:
|
|
115 |
'per_device_train_batch_size': 16,
|
116 |
'push_to_hub': True,
|
117 |
'remove_unused_columns': False,
|
118 |
-
'save_steps':
|
119 |
'save_strategy': 'steps',
|
120 |
'seed': 42,
|
121 |
'tokens_already_seen': 1649934336,
|
@@ -123,4 +123,4 @@ The following hyperparameters were used during training:
|
|
123 |
'weight_decay': 0.1}}
|
124 |
|
125 |
# Wandb URL:
|
126 |
-
https://wandb.ai/kejian/uncategorized/runs/
|
|
|
61 |
'skip_tokens': 1649934336},
|
62 |
'generation': {'batch_size': 128,
|
63 |
'every_n_steps': 256,
|
64 |
+
'force_call_on': [12588],
|
65 |
'metrics_configs': [{}, {'n': 1}, {}],
|
66 |
'scenario_configs': [{'display_as_html': True,
|
67 |
'generate_kwargs': {'do_sample': True,
|
|
|
89 |
'use_prompt_for_scoring': True}],
|
90 |
'scorer_config': {}},
|
91 |
'kl_gpt3_callback': {'every_n_steps': 256,
|
92 |
+
'force_call_on': [12588],
|
93 |
'gpt3_kwargs': {'model_name': 'code-cushman-001'},
|
94 |
'max_tokens': 64,
|
95 |
'num_samples': 4096},
|
|
|
115 |
'per_device_train_batch_size': 16,
|
116 |
'push_to_hub': True,
|
117 |
'remove_unused_columns': False,
|
118 |
+
'save_steps': 12588,
|
119 |
'save_strategy': 'steps',
|
120 |
'seed': 42,
|
121 |
'tokens_already_seen': 1649934336,
|
|
|
123 |
'weight_decay': 0.1}}
|
124 |
|
125 |
# Wandb URL:
|
126 |
+
https://wandb.ai/kejian/uncategorized/runs/3mpa7db7
|