Spaces:
Running
Running
| project: | |
| project: starvector-8b-text2svg | |
| use_wandb: false | |
| entity: joanrod | |
| copy_code: false | |
| model: | |
| max_length: 16000 | |
| model_name: starvector/starvector-8b-im2svg | |
| starcoder_model_name: bigcode/starcoder2-7b | |
| pretrained: true | |
| image_encoder_type: siglip_384 | |
| use_flash_attn: true | |
| adapter_norm: layer_norm | |
| init_type: normal | |
| dropout: 0.1 | |
| task: text2svg | |
| transformer_layer_cls: Starcoder2DecoderLayer # FSDP-specific | |
| use_cache: false | |
| training: | |
| save_model_epochs: 1 | |
| checkpointing_steps: 500 | |
| checkpoints_total_limit: 5 | |
| model_precision: bf16 | |
| resume_from_checkpoint: false | |
| continue_training: false | |
| n_epochs: 4 | |
| lr: 0.00001 | |
| gradient_accumulation_steps: 4 | |
| lr_scheduler: cosine | |
| lr_warmup_steps: 10 | |
| adam_beta1: 0.95 | |
| adam_beta2: 0.999 | |
| adam_weight_decay: 1.0e-06 | |
| adam_epsilon: 1e-08 | |
| optimizer: adamw | |
| use_gradient_checkpointing: true | |
| train_image_encoder: true | |
| train_LLM: true | |
| fsdp: | |
| enable: true # TODO: review this setting; set it to false only if you want to use DDP or are running PyTorch < 2.1 | |
| cpu_offload: false | |
| sharding_strategy: hsdp | |
| backward_prefetch: BACKWARD_PRE | |
| use_orig_params: true | |
| sync_module_states: true | |
| forward_prefetch: false | |
| cpu_ram_efficient_loading: true | |
| data: | |
| num_workers: 16 | |
| train: | |
| batch_size: 4 | |
| target: starvector.data.stacksvg.SVGStackDataset | |
| params: | |
| split: train | |
| dataset_name: starvector/text2svg-stack | |
| im_size: 384 | |
| num_samples: -1 | |
| transforms: false | |
| select_dataset_name: false | |
| image_processor: siglip_384 | |
| test: | |
| batch_size: 4 | |
| target: starvector.data.stacksvg.SVGStackDataset | |
| params: | |
| split: test | |
| dataset_name: starvector/text2svg-stack | |
| im_size: 384 | |
| num_samples: 64 | |
| transforms: false | |
| select_dataset_name: false | |
| image_processor: siglip_384 | |
| generation: | |
| max_length: 10000 | |
| min_length: 10 | |
| num_beams: 3 | |
| temperature: 1.0 | |
| num_captions: 1 | |
| repetition_penalty: 1.0 | |
| length_penalty: 0.5 | |
| top_p: 0.95 | |
| use_nucleus_sampling: true | |
| im_size: 384 | |
| dpi: 2 | |
| scale: 300 | |
| metrics: | |
| L2: false | |
| Masked-L2: false | |
| LPIPS: false | |
| SSIM: false | |
| FID: false | |
| FID_clip: false | |
| CLIPScore: true | |
| CountTokenLength: true | |
| ratio_post_processed: false | |
| ratio_non_compiling: false | |
| DinoScore: false |