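# Page header captured together with this file (not part of the configuration):
#   repository path as captured: sign / (remainder not captured)
#   AmitMY's picture
#   commit 4d1b0cf: Upload args.yaml with huggingface_hub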
# Training-argument snapshot. Keys are listed alphabetically, not by topic.
allow_missing_params: false
# Every mixed-precision switch in this stretch (amp, apex_amp, deepspeed_bf16,
# deepspeed_fp16) is false, and dtype is float32.
amp: false
apex_amp: false
batch_sentences_multiple_of: 8
# batch_type is `word`, so batch_size is presumably counted in words rather
# than sentences -- confirm against the consuming tool's documentation.
batch_size: 512
batch_type: word
bow_task_pos_weight: 10
bow_task_weight: 1.0
bucket_scaling: false
bucket_width: 8
# cache_last_best_params is 0; presumably that leaves the cache_* settings
# below without effect -- confirm.
cache_last_best_params: 0
cache_metric: perplexity
cache_strategy: best
checkpoint_improvement_threshold: 0.0
checkpoint_interval: 4000
clamp_to_dtype: false
config: null
decode_and_evaluate: 500
decoder: transformer
deepspeed_bf16: false
deepspeed_fp16: false
device_id: 0
dist: false
dry_run: false
dtype: float32
# Two-element list, a shape several keys in this file share. The two slots are
# presumably source/target or encoder/decoder -- confirm per key.
embed_dropout:
- 0.0
- 0.0
encoder: transformer
end_of_prepending_tag: null
env: null
fixed_param_names: []
fixed_param_strategy: null
# gradient_clipping_type is the plain string `none` (a string, not YAML null);
# the threshold is presumably ignored while the type is `none` -- confirm.
gradient_clipping_threshold: 1.0
gradient_clipping_type: none
ignore_extra_params: false
initial_learning_rate: 0.0002
keep_initializations: false
# NOTE(review): -1 presumably means "keep all parameter files" -- confirm.
keep_last_params: -1
label_smoothing: 0.1
label_smoothing_impl: mxnet
# Learning-rate schedule: plateau-reduce with factor 0.9 and a patience of 8
# (presumably counted in checkpoints -- confirm); warmup is 0.
learning_rate_reduce_factor: 0.9
learning_rate_reduce_num_not_improved: 8
learning_rate_scheduler_type: plateau-reduce
learning_rate_warmup: 0
# length_task is null; the two length_task_* values below presumably have no
# effect in that case -- confirm.
length_task: null
length_task_layers: 1
length_task_weight: 1.0
lhuc: null
local_rank: null
loglevel: INFO
loglevel_secondary_workers: INFO
# Of the max_* limits in this stretch only max_num_checkpoint_not_improved is
# set; the others are null.
max_checkpoints: null
max_num_checkpoint_not_improved: 20
max_num_epochs: null
max_samples: null
max_seconds: null
# Two different limits (512 and 128); presumably source and target sequence
# length respectively -- confirm.
max_seq_len:
- 512
- 128
# No update/epoch/sample bounds are set: all four values below are null.
max_updates: null
min_num_epochs: null
min_samples: null
min_updates: null
momentum: 0.0
neural_vocab_selection: null
neural_vocab_selection_block_loss: false
no_bucketing: false
no_logfile: false
no_reload_on_learning_rate_reduce: false
# Both entries are null; presumably the embedding size is then derived from
# transformer_model_size -- confirm.
num_embed:
- null
- null
num_layers:
- 6
- 6
# NOTE(review): 0 presumably means "no vocabulary size cap" -- confirm.
num_words:
- 0
- 0
# The optimized metric (chrf) differs from cache_metric (perplexity).
optimized_metric: chrf
optimizer: adam
optimizer_betas:
- 0.9
- 0.999
optimizer_eps: 1.0e-08
# Absolute, machine-specific paths. `output` and `prepared_data` live under
# .../sockeye/expanded-cleaned/, whereas `params` points into
# .../sockeye/expanded/model/ -- a different run directory. Presumably this run
# was initialised from that earlier model's best parameters -- confirm.
output: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded-cleaned/model
overwrite_output: false
pad_vocab_to_multiple_of: 8
params: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded/model/params.best
prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded-cleaned/train_data
quiet: false
quiet_secondary_workers: false
seed: 1
shared_vocab: false
# `source` and `target` are null; training data is given through
# `prepared_data` above instead.
source: null
# All source-factor settings are empty lists.
source_factor_vocabs: []
source_factors: []
source_factors_combine: []
source_factors_num_embed: []
source_factors_share_embedding: []
source_factors_use_source_vocab: []
source_vocab: null
stop_training_on_decoder_failure: false
target: null
# All target-factor settings are empty lists as well; only the weight list
# below has an entry.
target_factor_vocabs: []
target_factors: []
target_factors_combine: []
target_factors_num_embed: []
target_factors_share_embedding: []
target_factors_use_target_vocab: []
target_factors_weight:
- 1.0
target_vocab: null
tf32: true
# Two-element lists with identical entries; presumably encoder then decoder
# -- confirm.
transformer_activation_type:
- relu
- relu
transformer_attention_heads:
- 8
- 8
transformer_block_prepended_cross_attention: false
# Dropout settings. Each key carries its own explicit two-element list (no
# shared anchor/alias), so one can be changed without affecting the others.
# The two slots are presumably encoder then decoder -- confirm.
transformer_dropout_act:
- 0.1
- 0.1
transformer_dropout_attention:
- 0.1
- 0.1
transformer_dropout_prepost:
- 0.1
- 0.1
# Feed-forward width (2048) is four times the model size (512) in both slots.
# The two slots are presumably encoder then decoder -- confirm.
transformer_feed_forward_num_hidden:
- 2048
- 2048
transformer_feed_forward_use_glu: false
transformer_model_size:
- 512
- 512
transformer_positional_embedding_type: fixed
# Short letter-code sequences, one entry per slot (presumably encoder then
# decoder). NOTE(review): the letters presumably stand for n = layer norm,
# d = dropout, r = residual -- confirm against the consuming tool's docs.
transformer_postprocess:
- dr
- dr
# `n` is quoted on purpose: a bare n is one of the YAML 1.1 boolean spellings,
# so spec-following resolvers would load it as false instead of the string.
transformer_preprocess:
- 'n'
- 'n'
update_interval: 1
use_cpu: false
# The validation files sit in different locations and carry different
# suffixes: the source is a `.tokenized` file under /home/..., the target a
# `.bpe` file under /shares/... . Both paths are absolute and machine-specific.
validation_source: /home/amoryo/sign-language/signbank-annotation/signbank-plus/data/parallel/cleaned/dev.source.tokenized
validation_source_factors: []
validation_target: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded-cleaned/dev.target.bpe
validation_target_factors: []
weight_decay: 0.0
# The plain string `none` (a string, not YAML null).
weight_tying_type: none
word_min_count:
- 1
- 1