diff --git a/segm/config/20240604211922-ade20k-seg_base_deit_linear-variant.yml b/segm/config/20240604211922-ade20k-seg_base_deit_linear-variant.yml
new file mode 100644
index 0000000..2d4c3e3
--- /dev/null
+++ b/segm/config/20240604211922-ade20k-seg_base_deit_linear-variant.yml
@@ -0,0 +1,58 @@
+algorithm_kwargs:  # run config: dataset ade20k, backbone vit_deit_base_distilled_patch16_384, decoder "linear"
+  batch_size: 1  # same value as dataset_kwargs.batch_size
+  eval_freq: 1  # the other ade20k files in this patch use 2
+  num_epochs: 64  # same value as optimizer_kwargs.epochs
+  start_epoch: 0
+amp: false
+dataset_kwargs:
+  batch_size: 1
+  crop_size: 512  # equals both entries of net_kwargs.image_size
+  dataset: ade20k
+  image_size: 512
+  normalization: deit  # same value as net_kwargs.normalization
+  num_workers: 10
+  re_mode: pixel  # only present in the two deit files of this patch
+  split: train
+debug: false
+inference_kwargs:
+  im_size: 512
+  window_size: 512
+  window_stride: 512  # stride equals window_size; presumably non-overlapping windows - TODO confirm
+net_kwargs:
+  backbone: vit_deit_base_distilled_patch16_384
+  d_model: 768  # 768 / n_heads (12) = 64
+  decoder:
+    n_cls: 150  # repeated as net_kwargs.n_cls below
+    name: linear
+  distilled: true
+  drop_path_rate: 0.1
+  dropout: 0.0
+  image_size: !!python/tuple  # Python-specific tag: rejected by safe loaders (e.g. yaml.safe_load)
+  - 512
+  - 512
+  mlp_ratio: 4
+  n_cls: 150
+  n_heads: 12
+  n_layers: 12
+  normalization: deit
+  patch_size: 16
+optimizer_kwargs:
+  clip_grad: null
+  cooldown_epochs: 10  # cooldown/decay/warmup_* keys appear only in this file; the others use iter_warmup
+  decay_rate: 0.1
+  epochs: 64
+  iter_max: 161728  # = 64 * 2527; presumably epochs * iterations per epoch - TODO confirm
+  lr: 0.001
+  min_lr: 1.0e-05
+  momentum: 0.9
+  opt: sgd
+  poly_power: 0.9
+  poly_step_size: 1
+  sched: polynomial
+  warmup_epochs: 0
+  warmup_lr: 1.0e-06
+  weight_decay: 0.0
+resume: true
+seed: 2
+version: normal
+world_batch_size: 8  # NOTE(review): algorithm_kwargs.batch_size is 1; presumably 8 is the total across processes - confirm
diff --git a/segm/config/20240604211922-ade20k-seg_base_deit_mask-variant.yml b/segm/config/20240604211922-ade20k-seg_base_deit_mask-variant.yml
new file mode 100644
index 0000000..341d837
--- /dev/null
+++ b/segm/config/20240604211922-ade20k-seg_base_deit_mask-variant.yml
@@ -0,0 +1,58 @@
+algorithm_kwargs:  # run config: dataset ade20k, backbone vit_deit_base_distilled_patch16_384, mask-transformer decoder
+  batch_size: 1  # same value as dataset_kwargs.batch_size
+  eval_freq: 2
+  num_epochs: 64  # same value as optimizer_kwargs.epochs
+  start_epoch: 18  # NOTE(review): non-zero with resume: true; presumably captured from a resumed run - confirm before reuse
+amp: false
+dataset_kwargs:
+  batch_size: 1
+  crop_size: 512  # equals both entries of net_kwargs.image_size
+  dataset: ade20k
+  image_size: 512
+  normalization: deit  # same value as net_kwargs.normalization
+  num_workers: 10
+  re_mode: pixel  # only present in the two deit files of this patch
+  split: train
+debug: false
+inference_kwargs:
+  im_size: 512
+  window_size: 512
+  window_stride: 512  # stride equals window_size; presumably non-overlapping windows - TODO confirm
+net_kwargs:
+  backbone: vit_deit_base_distilled_patch16_384
+  d_model: 768  # 768 / n_heads (12) = 64
+  decoder:
+    drop_path_rate: 0.0  # decoder-level values differ from the net_kwargs-level drop_path_rate/dropout below
+    dropout: 0.1
+    n_cls: 150  # repeated as net_kwargs.n_cls below
+    n_layers: 2
+    name: mask_transformer_l2.u1.d768  # NOTE(review): other mask files use plain "mask_transformer"; verify the consumer accepts this suffix
+  distilled: true
+  drop_path_rate: 0.1
+  dropout: 0.0
+  image_size: !!python/tuple  # Python-specific tag: rejected by safe loaders (e.g. yaml.safe_load)
+  - 512
+  - 512
+  mlp_ratio: 4
+  n_cls: 150
+  n_heads: 12
+  n_layers: 12
+  normalization: deit
+  patch_size: 16
+optimizer_kwargs:
+  clip_grad: null
+  epochs: 64
+  iter_max: 161728  # = 64 * 2527; presumably epochs * iterations per epoch - TODO confirm
+  iter_warmup: 0.0
+  lr: 0.001
+  min_lr: 1.0e-05
+  momentum: 0.9
+  opt: sgd
+  poly_power: 0.9
+  poly_step_size: 1
+  sched: polynomial
+  weight_decay: 0.0
+resume: true
+seed: 3
+version: normal
+world_batch_size: 8  # NOTE(review): algorithm_kwargs.batch_size is 1; presumably 8 is the total across processes - confirm
diff --git a/segm/config/20240604211922-ade20k-seg_base_mask-variant.yml b/segm/config/20240604211922-ade20k-seg_base_mask-variant.yml
new file mode 100644
index 0000000..07fa571
--- /dev/null
+++ b/segm/config/20240604211922-ade20k-seg_base_mask-variant.yml
@@ -0,0 +1,55 @@
+algorithm_kwargs:  # run config: dataset ade20k, backbone vit_base_patch16_384, decoder "mask_transformer"
+  batch_size: 1  # same value as dataset_kwargs.batch_size
+  eval_freq: 2
+  num_epochs: 64  # same value as optimizer_kwargs.epochs
+  start_epoch: 0
+amp: false
+dataset_kwargs:
+  batch_size: 1
+  crop_size: 512  # equals both entries of net_kwargs.image_size
+  dataset: ade20k
+  image_size: 512
+  normalization: vit  # same value as net_kwargs.normalization
+  num_workers: 10
+  split: train
+debug: false
+inference_kwargs:
+  im_size: 512
+  window_size: 512
+  window_stride: 512  # stride equals window_size; presumably non-overlapping windows - TODO confirm
+net_kwargs:
+  backbone: vit_base_patch16_384
+  d_model: 768  # 768 / n_heads (12) = 64
+  decoder:
+    drop_path_rate: 0.0  # decoder-level values differ from the net_kwargs-level drop_path_rate/dropout below
+    dropout: 0.1
+    n_cls: 150  # repeated as net_kwargs.n_cls below
+    n_layers: 2
+    name: mask_transformer
+  distilled: false
+  drop_path_rate: 0.1
+  dropout: 0.0
+  image_size: !!python/tuple  # Python-specific tag: rejected by safe loaders (e.g. yaml.safe_load)
+  - 512
+  - 512
+  n_cls: 150
+  n_heads: 12
+  n_layers: 12
+  normalization: vit
+  patch_size: 16
+optimizer_kwargs:
+  clip_grad: null
+  epochs: 64
+  iter_max: 161728  # = 64 * 2527; presumably epochs * iterations per epoch - TODO confirm
+  iter_warmup: 0.0
+  lr: 0.001
+  min_lr: 1.0e-05
+  momentum: 0.9
+  opt: sgd
+  poly_power: 0.9
+  poly_step_size: 1
+  sched: polynomial
+  weight_decay: 0.0
+resume: true  # note: this file has no seed key, unlike the two deit files in this patch
+version: normal
+world_batch_size: 8  # NOTE(review): algorithm_kwargs.batch_size is 1; presumably 8 is the total across processes - confirm
diff --git a/segm/config/20240604211922-ade20k-seg_small_mask-variant.yml b/segm/config/20240604211922-ade20k-seg_small_mask-variant.yml
new file mode 100644
index 0000000..3c3e587
--- /dev/null
+++ b/segm/config/20240604211922-ade20k-seg_small_mask-variant.yml
@@ -0,0 +1,55 @@
+algorithm_kwargs:  # run config: dataset ade20k, backbone vit_small_patch16_384, decoder "mask_transformer"
+  batch_size: 2  # same value as dataset_kwargs.batch_size
+  eval_freq: 2
+  num_epochs: 64  # same value as optimizer_kwargs.epochs
+  start_epoch: 0
+amp: false
+dataset_kwargs:
+  batch_size: 2
+  crop_size: 512  # equals both entries of net_kwargs.image_size
+  dataset: ade20k
+  image_size: 512
+  normalization: vit  # same value as net_kwargs.normalization
+  num_workers: 10
+  split: train
+debug: false
+inference_kwargs:
+  im_size: 512
+  window_size: 512
+  window_stride: 512  # stride equals window_size; presumably non-overlapping windows - TODO confirm
+net_kwargs:
+  backbone: vit_small_patch16_384
+  d_model: 384  # 384 / n_heads (6) = 64
+  decoder:
+    drop_path_rate: 0.0  # decoder-level values differ from the net_kwargs-level drop_path_rate/dropout below
+    dropout: 0.1
+    n_cls: 150  # repeated as net_kwargs.n_cls below
+    n_layers: 2
+    name: mask_transformer
+  distilled: false
+  drop_path_rate: 0.1
+  dropout: 0.0
+  image_size: !!python/tuple  # Python-specific tag: rejected by safe loaders (e.g. yaml.safe_load)
+  - 512
+  - 512
+  n_cls: 150
+  n_heads: 6
+  n_layers: 12
+  normalization: vit
+  patch_size: 16
+optimizer_kwargs:
+  clip_grad: null
+  epochs: 64
+  iter_max: 161728  # = 64 * 2527; presumably epochs * iterations per epoch - TODO confirm
+  iter_warmup: 0.0
+  lr: 0.001
+  min_lr: 1.0e-05
+  momentum: 0.9
+  opt: sgd
+  poly_power: 0.9
+  poly_step_size: 1
+  sched: polynomial
+  weight_decay: 0.0
+resume: true  # note: this file has no seed key, unlike the two deit files in this patch
+version: normal
+world_batch_size: 8  # NOTE(review): algorithm_kwargs.batch_size is 2; presumably 8 is the total across processes - confirm
diff --git a/segm/config/20240604211922-ade20k-seg_tiny_mask-variant.yml b/segm/config/20240604211922-ade20k-seg_tiny_mask-variant.yml
new file mode 100644
index 0000000..bd04718
--- /dev/null
+++ b/segm/config/20240604211922-ade20k-seg_tiny_mask-variant.yml
@@ -0,0 +1,55 @@
+algorithm_kwargs:  # run config: dataset ade20k, backbone vit_tiny_patch16_384, decoder "mask_transformer"
+  batch_size: 2  # same value as dataset_kwargs.batch_size
+  eval_freq: 2
+  num_epochs: 64  # same value as optimizer_kwargs.epochs
+  start_epoch: 0
+amp: false
+dataset_kwargs:
+  batch_size: 2
+  crop_size: 512  # equals both entries of net_kwargs.image_size
+  dataset: ade20k
+  image_size: 512
+  normalization: vit  # same value as net_kwargs.normalization
+  num_workers: 10
+  split: train
+debug: false
+inference_kwargs:
+  im_size: 512
+  window_size: 512
+  window_stride: 512  # stride equals window_size; presumably non-overlapping windows - TODO confirm
+net_kwargs:
+  backbone: vit_tiny_patch16_384
+  d_model: 192  # 192 / n_heads (3) = 64
+  decoder:
+    drop_path_rate: 0.0  # decoder-level values differ from the net_kwargs-level drop_path_rate/dropout below
+    dropout: 0.1
+    n_cls: 150  # repeated as net_kwargs.n_cls below
+    n_layers: 2
+    name: mask_transformer
+  distilled: false
+  drop_path_rate: 0.1
+  dropout: 0.0
+  image_size: !!python/tuple  # Python-specific tag: rejected by safe loaders (e.g. yaml.safe_load)
+  - 512
+  - 512
+  n_cls: 150
+  n_heads: 3
+  n_layers: 12
+  normalization: vit
+  patch_size: 16
+optimizer_kwargs:
+  clip_grad: null
+  epochs: 64
+  iter_max: 161728  # = 64 * 2527; presumably epochs * iterations per epoch - TODO confirm
+  iter_warmup: 0.0
+  lr: 0.001
+  min_lr: 1.0e-05
+  momentum: 0.9
+  opt: sgd
+  poly_power: 0.9
+  poly_step_size: 1
+  sched: polynomial
+  weight_decay: 0.0
+resume: true  # note: this file has no seed key, unlike the two deit files in this patch
+version: normal
+world_batch_size: 8  # NOTE(review): algorithm_kwargs.batch_size is 2; presumably 8 is the total across processes - confirm
diff --git a/segm/config/20240604211922-cityscapes-seg_large_mask.yml b/segm/config/20240604211922-cityscapes-seg_large_mask.yml
new file mode 100644
index 0000000..eda3307
--- /dev/null
+++ b/segm/config/20240604211922-cityscapes-seg_large_mask.yml
@@ -0,0 +1,53 @@
+algorithm_kwargs:  # run config: dataset cityscapes, backbone vit_large_patch16_384, decoder "mask_transformer"
+  batch_size: 1  # same value as dataset_kwargs.batch_size
+  eval_freq: 8
+  num_epochs: 216  # same value as optimizer_kwargs.epochs
+  start_epoch: 214  # NOTE(review): 214 of 216 with resume: true; presumably captured near the end of a run - confirm before reuse
+amp: false
+dataset_kwargs:
+  batch_size: 1
+  crop_size: 768  # equals both entries of net_kwargs.image_size and inference_kwargs.window_size
+  dataset: cityscapes
+  image_size: 1024  # same value as inference_kwargs.im_size
+  normalization: vit  # same value as net_kwargs.normalization
+  num_workers: 10
+  split: train
+inference_kwargs:  # note: unlike the ade20k files, this file has no top-level debug key
+  im_size: 1024
+  window_size: 768
+  window_stride: 512  # stride is smaller than window_size; presumably windows overlap by 256 - TODO confirm
+net_kwargs:
+  backbone: vit_large_patch16_384
+  d_model: 1024  # 1024 / n_heads (16) = 64
+  decoder:
+    drop_path_rate: 0.0  # decoder-level values differ from the net_kwargs-level drop_path_rate/dropout below
+    dropout: 0.1
+    n_cls: 19  # repeated as net_kwargs.n_cls below
+    n_layers: 1
+    name: mask_transformer
+  drop_path_rate: 0.1  # note: no distilled key in this file, unlike the ade20k files
+  dropout: 0.0
+  image_size: !!python/tuple  # Python-specific tag: rejected by safe loaders (e.g. yaml.safe_load)
+  - 768
+  - 768
+  n_cls: 19
+  n_heads: 16
+  n_layers: 24
+  normalization: vit
+  patch_size: 16
+optimizer_kwargs:
+  clip_grad: null
+  epochs: 216
+  iter_max: 80352  # = 216 * 372; presumably epochs * iterations per epoch - TODO confirm
+  iter_warmup: 0.0
+  lr: 0.01  # ten times the 0.001 used by the ade20k files in this patch
+  min_lr: 1.0e-05
+  momentum: 0.9
+  opt: sgd
+  poly_power: 0.9
+  poly_step_size: 1
+  sched: polynomial
+  weight_decay: 0.0
+resume: true  # note: this file has no seed key
+version: normal
+world_batch_size: 8  # NOTE(review): algorithm_kwargs.batch_size is 1; presumably 8 is the total across processes - confirm