# Training / evaluation configuration for the `starvector-8b-text2svg` run.
#
# NOTE(review): this file was reconstructed from a flattened dump in which
# every line carried a trailing "|" and all indentation had been lost. The
# nesting below is inferred from the order of the section-header keys (keys
# that had no value). In particular, confirm against the config loader that
# `fsdp`, `generation` and `metrics` are top-level sections and that
# `im_size` / `dpi` / `scale` belong under `generation`.

project:
  project: starvector-8b-text2svg
  use_wandb: false
  entity: joanrod
  copy_code: false

model:
  max_length: 16000
  model_name: starvector/starvector-8b-im2svg
  starcoder_model_name: bigcode/starcoder2-7b
  pretrained: true
  image_encoder_type: siglip_384
  use_flash_attn: true
  adapter_norm: layer_norm
  init_type: normal
  dropout: 0.1
  task: text2svg
  transformer_layer_cls: Starcoder2DecoderLayer
  use_cache: false

training:
  save_model_epochs: 1
  checkpointing_steps: 500
  checkpoints_total_limit: 5
  model_precision: bf16
  resume_from_checkpoint: false
  continue_training: false
  n_epochs: 4
  lr: 0.00001
  gradient_accumulation_steps: 4
  lr_scheduler: cosine
  lr_warmup_steps: 10
  adam_beta1: 0.95
  adam_beta2: 0.999
  adam_weight_decay: 1.0e-06
  # Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
  # resolve a bare `1e-08` as a string rather than a float.
  adam_epsilon: 1.0e-08
  optimizer: adamw
  use_gradient_checkpointing: true
  train_image_encoder: true
  train_LLM: true

fsdp:
  enable: true
  cpu_offload: false
  sharding_strategy: hsdp
  backward_prefetch: BACKWARD_PRE
  use_orig_params: true
  sync_module_states: true
  forward_prefetch: false
  cpu_ram_efficient_loading: true

data:
  num_workers: 16
  train:
    batch_size: 4
    target: starvector.data.stacksvg.SVGStackDataset
    params:
      split: train
      dataset_name: starvector/text2svg-stack
      im_size: 384
      num_samples: -1
      transforms: false
      select_dataset_name: false
      image_processor: siglip_384
  test:
    batch_size: 4
    target: starvector.data.stacksvg.SVGStackDataset
    params:
      split: test
      dataset_name: starvector/text2svg-stack
      im_size: 384
      num_samples: 64
      transforms: false
      select_dataset_name: false
      image_processor: siglip_384

generation:
  max_length: 10000
  min_length: 10
  num_beams: 3
  temperature: 1.0
  num_captions: 1
  repetition_penalty: 1.0
  length_penalty: 0.5
  top_p: 0.95
  use_nucleus_sampling: true
  im_size: 384
  dpi: 2
  scale: 300

# Per-metric on/off switches; only CLIPScore and CountTokenLength are enabled.
metrics:
  L2: false
  Masked-L2: false
  LPIPS: false
  SSIM: false
  FID: false
  FID_clip: false
  CLIPScore: true
  CountTokenLength: true
  ratio_post_processed: false
  ratio_non_compiling: false
  DinoScore: false