# ImageGuard/lora/config.yaml
# Last commit: "Upload folder using huggingface_hub" by adwardlee (33a11e7, verified)
# Data section: a base path per evaluation dataset plus options for the
# training set.
# NOTE(review): the original indentation was lost; the nesting below is
# reconstructed from the sorted key order. Confirm it against the code that
# loads this file.
data_cfg:
  data_cfg:
    eval:
      JsonDataset:
        base_path: data
        fairness: true
        generated_ratio: 1.0
        real_ratio: 1.0
        safety: true
      SMID:
        base_path: data/evaluator_test/SMID
      SelfHarm:
        base_path: data/evaluator_test/self-harm
      UnsafeBench:
        base_path: data/evaluator_test/UnsafeBench
      UnsafeDiff:
        base_path: data/evaluator_test/Unsafe_diff
      ViolentBehavior:
        base_path: data/evaluator_test/Violent_behavior
    train:
      base_path: data
      fairness: true
      generated_ratio: 1.0
      max_face_length: 2000
      max_generated_dim_length: 6000
      max_real_dim_length: 600
      real_ratio: 1.0
      safe_ratio: 0.3
      safety: true
  # NOTE(review): the placement of this key is ambiguous. Key order alone would
  # also allow it under `train` or next to `eval`/`train` - verify with the
  # consumer. The name looks like a typo for `version`; it is kept as-is
  # because the loader may read it under this spelling.
  verion: 3
# LoRA section: rank, alpha, dropout, bias mode and the list of module names
# the adapter targets.
lora_cfg:
  lora_alpha: 256
  lora_bias: none
  lora_dropout: 0.05
  lora_r: 256
  lora_target_modules:
    - attention.wqkv
    - attention.wo
    - feed_forward.w1
    - feed_forward.w2
    - feed_forward.w3
  lora_type: lora
  # Empty string: no adapter weight path is given here.
  lora_weight_path: ''
# Model section: which base model to load.
# NOTE(review): presumably a directory relative to the working directory -
# confirm.
model_cfg:
  model_name_or_path: model_zoo/internlm-xcomposer2-vl-7b
# Trainer section.
# NOTE(review): most keys appear to mirror Hugging Face `TrainingArguments`,
# with a few project-specific additions (e.g. fix_sampler, fix_vit,
# max_length, use_lora) - confirm against the training script.
# The nesting of `accelerator_config`, `fsdp_config` and `label_names` was
# reconstructed from the sorted key order after the original indentation was
# lost.
training_cfg:
  _n_gpu: 1
  accelerator_config:
    dispatch_batches: null
    even_batches: true
    gradient_accumulation_kwargs: null
    non_blocking: false
    split_batches: false
    use_seedable_sampler: true
  adafactor: false
  adam_beta1: 0.9
  adam_beta2: 0.95
  adam_epsilon: 1.0e-08
  auto_find_batch_size: false
  batch_eval_metrics: false
  bf16: true
  bf16_full_eval: false
  cache_dir: null
  data_seed: null
  dataloader_drop_last: false
  dataloader_num_workers: 0
  dataloader_persistent_workers: false
  dataloader_pin_memory: true
  dataloader_prefetch_factor: null
  ddp_backend: null
  ddp_broadcast_buffers: null
  ddp_bucket_cap_mb: null
  ddp_find_unused_parameters: null
  ddp_timeout: 1800
  debug: []
  deepspeed: scripts/ds_config_zero2.json
  disable_tqdm: false
  dispatch_batches: null
  do_eval: true
  do_predict: false
  do_train: false
  eval_accumulation_steps: null
  eval_delay: 0
  eval_do_concat_batches: true
  eval_steps: null
  fix_sampler: false
  fix_vit: true
  fp16: false
  fp16_backend: auto
  fp16_full_eval: false
  fp16_opt_level: O1
  fsdp: []
  fsdp_config:
    min_num_params: 0
    xla: false
    xla_fsdp_grad_ckpt: false
    xla_fsdp_v2: false
  fsdp_min_num_params: 0
  fsdp_transformer_layer_cls_to_wrap: null
  full_determinism: false
  gradient_accumulation_steps: 1
  gradient_checkpointing: true
  gradient_checkpointing_kwargs: null
  greater_is_better: null
  group_by_length: false
  half_precision_backend: auto
  hub_always_push: false
  hub_model_id: null
  hub_private_repo: false
  hub_token: null
  ignore_data_skip: false
  include_inputs_for_metrics: false
  include_num_input_tokens_seen: false
  include_tokens_per_second: false
  jit_mode_eval: false
  label_names:
    - samples
  label_smoothing_factor: 0.0
  learning_rate: 5.0e-05
  length_column_name: length
  load_best_model_at_end: false
  # NOTE(review): looks like a process rank captured from a distributed launch
  # rather than a portable setting - confirm before reusing this file.
  local_rank: 7
  log_level: passive
  log_level_replica: warning
  log_on_each_node: true
  # NOTE(review): logging_dir, output_dir and run_name share the same value,
  # which contains a doubled slash (`//`); left untouched because it is a
  # runtime path.
  logging_dir: output/internlm/datav3_1/safe0.3_lr5e-5_decay1e-2_nocap_e2//safe0.3_nocap
  logging_first_step: false
  logging_nan_inf_filter: true
  logging_steps: 10
  lr_scheduler_kwargs: {}
  max_grad_norm: 1.0
  max_length: 4096
  max_steps: -1
  metric_for_best_model: null
  mp_parameters: ''
  neftune_noise_alpha: null
  no_cuda: false
  num_train_epochs: 2.0
  optim_args: null
  optim_target_modules: null
  output_dir: output/internlm/datav3_1/safe0.3_lr5e-5_decay1e-2_nocap_e2//safe0.3_nocap
  overwrite_output_dir: false
  past_index: -1
  per_device_eval_batch_size: 8
  per_device_train_batch_size: 8
  per_gpu_eval_batch_size: null
  per_gpu_train_batch_size: null
  prediction_loss_only: false
  push_to_hub: false
  push_to_hub_model_id: null
  push_to_hub_organization: null
  push_to_hub_token: null
  ray_scope: last
  remove_unused_columns: true
  report_to: []
  restore_callback_states_from_checkpoint: false
  resume_from_checkpoint: null
  run_name: output/internlm/datav3_1/safe0.3_lr5e-5_decay1e-2_nocap_e2//safe0.3_nocap
  save_on_each_node: false
  save_only_model: false
  save_safetensors: true
  save_steps: 500
  save_total_limit: 1
  seed: 3407
  skip_memory_metrics: true
  split_batches: null
  tf32: null
  torch_compile: false
  torch_compile_backend: null
  torch_compile_mode: null
  torchdynamo: null
  tpu_metrics_debug: false
  tpu_num_cores: null
  use_cpu: false
  use_ipex: false
  use_legacy_prediction_loop: false
  use_lora: true
  use_mps_device: false
  warmup_ratio: 0.01
  warmup_steps: 0
  weight_decay: 0.01