sign
/

sockeye-signwriting-to-text

Model card | Files and versions | Community

sockeye-signwriting-to-text / args.yaml

AmitMY's picture

Upload args.yaml with huggingface_hub

4d1b0cf about 1 year ago

history blame contribute delete

3.42 kB

	# Recorded arguments for a Sockeye model run (the paths below point into
	# .../checkpoints/sockeye/...). This is a flat mapping with one setting per key,
	# and the keys are listed in alphabetical order.
	# NOTE(review): every line of this listing starts with a tab character. YAML does
	# not allow tabs for indentation, so strip the leading tab before feeding this to
	# a YAML parser.
	# NOTE(review): the two-element lists (embed_dropout, max_seq_len, num_layers, ...)
	# presumably hold a source/encoder value followed by a target/decoder value --
	# confirm against the Sockeye command-line documentation.
	allow_missing_params: false
	amp: false
	apex_amp: false
	batch_sentences_multiple_of: 8
	batch_size: 512
	batch_type: word
	bow_task_pos_weight: 10
	bow_task_weight: 1.0
	bucket_scaling: false
	bucket_width: 8
	cache_last_best_params: 0
	# cache_metric is perplexity while optimized_metric (further down) is chrf.
	cache_metric: perplexity
	cache_strategy: best
	checkpoint_improvement_threshold: 0.0
	checkpoint_interval: 4000
	clamp_to_dtype: false
	config: null
	decode_and_evaluate: 500
	decoder: transformer
	deepspeed_bf16: false
	deepspeed_fp16: false
	device_id: 0
	dist: false
	dry_run: false
	dtype: float32
	embed_dropout:
	- 0.0
	- 0.0
	encoder: transformer
	end_of_prepending_tag: null
	env: null
	fixed_param_names: []
	fixed_param_strategy: null
	gradient_clipping_threshold: 1.0
	gradient_clipping_type: none
	ignore_extra_params: false
	initial_learning_rate: 0.0002
	keep_initializations: false
	keep_last_params: -1
	label_smoothing: 0.1
	label_smoothing_impl: mxnet
	learning_rate_reduce_factor: 0.9
	learning_rate_reduce_num_not_improved: 8
	learning_rate_scheduler_type: plateau-reduce
	learning_rate_warmup: 0
	length_task: null
	length_task_layers: 1
	length_task_weight: 1.0
	lhuc: null
	local_rank: null
	loglevel: INFO
	loglevel_secondary_workers: INFO
	# All max_*/min_* limits on checkpoints, epochs, samples, seconds and updates are
	# null in this file; max_num_checkpoint_not_improved (20) is the only one of these
	# limits with a value. Presumably that makes it the effective stopping criterion --
	# TODO confirm.
	max_checkpoints: null
	max_num_checkpoint_not_improved: 20
	max_num_epochs: null
	max_samples: null
	max_seconds: null
	max_seq_len:
	- 512
	- 128
	max_updates: null
	min_num_epochs: null
	min_samples: null
	min_updates: null
	momentum: 0.0
	neural_vocab_selection: null
	neural_vocab_selection_block_loss: false
	no_bucketing: false
	no_logfile: false
	no_reload_on_learning_rate_reduce: false
	num_embed:
	- null
	- null
	num_layers:
	- 6
	- 6
	num_words:
	- 0
	- 0
	optimized_metric: chrf
	optimizer: adam
	optimizer_betas:
	- 0.9
	- 0.999
	optimizer_eps: 1.0e-08
	# output, params and prepared_data are absolute, machine-specific paths.
	# output and prepared_data live under .../expanded-cleaned/, whereas params points
	# at params.best under .../expanded/model. Presumably this run was initialised
	# from the weights of that other run -- TODO confirm.
	output: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded-cleaned/model
	overwrite_output: false
	pad_vocab_to_multiple_of: 8
	params: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded/model/params.best
	prepared_data: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded-cleaned/train_data
	quiet: false
	quiet_secondary_workers: false
	seed: 1
	shared_vocab: false
	# source (and target, further down) are null while prepared_data is set.
	source: null
	source_factor_vocabs: []
	source_factors: []
	source_factors_combine: []
	source_factors_num_embed: []
	source_factors_share_embedding: []
	source_factors_use_source_vocab: []
	source_vocab: null
	stop_training_on_decoder_failure: false
	target: null
	target_factor_vocabs: []
	target_factors: []
	target_factors_combine: []
	target_factors_num_embed: []
	target_factors_share_embedding: []
	target_factors_use_target_vocab: []
	target_factors_weight:
	- 1.0
	target_vocab: null
	tf32: true
	transformer_activation_type:
	- relu
	- relu
	transformer_attention_heads:
	- 8
	- 8
	transformer_block_prepended_cross_attention: false
	# &id001 anchors the list [0.1, 0.1]; transformer_dropout_attention and
	# transformer_dropout_prepost alias it (*id001), so all three dropout settings
	# resolve to the same two values. Editing the list here changes all three.
	transformer_dropout_act: &id001
	- 0.1
	- 0.1
	transformer_dropout_attention: *id001
	transformer_dropout_prepost: *id001
	transformer_feed_forward_num_hidden:
	- 2048
	- 2048
	transformer_feed_forward_use_glu: false
	transformer_model_size:
	- 512
	- 512
	transformer_positional_embedding_type: fixed
	transformer_postprocess:
	- dr
	- dr
	transformer_preprocess:
	- n
	- n
	update_interval: 1
	use_cpu: false
	# validation_source sits under /home/amoryo/..., unlike validation_target and the
	# other paths in this file, which sit under /shares/volk.cl.uzh/...; both are
	# absolute paths. The file suffixes also differ: .tokenized versus .bpe.
	validation_source: /home/amoryo/sign-language/signbank-annotation/signbank-plus/data/parallel/cleaned/dev.source.tokenized
	validation_source_factors: []
	validation_target: /shares/volk.cl.uzh/amoryo/checkpoints/sockeye/expanded-cleaned/dev.target.bpe
	validation_target_factors: []
	weight_decay: 0.0
	weight_tying_type: none
	word_min_count:
	- 1
	- 1