Add config files

Murhaf · web-flow · commit df9b4e256ef5 · 2024-03-27T16:27:48.000+01:00
diff --git a/configs/t5_gold_synthetic.json b/configs/t5_gold_synthetic.json
@@ -0,0 +1,43 @@
+
+{
+    "output_dir": "T5-MSAizer-full",
+    "dataset_name": "Murhaf/dialect_msa_silver_parallel",
+    "model_name": "UBC-NLP/AraT5v2-base-1024",
+    "model_revision": "main",
+    "source_prefix": "ترجمة للفصحى: ",
+
+    "source_column": "source",
+    "target_column": "target",
+
+    "overwrite_output_dir": true,
+    "do_train": true,
+    "do_eval": true,
+    "do_predict": false,
+
+    "max_source_length": 1024,
+    "max_target_length": 1024,
+    "generation_max_length": 512,
+
+    "learning_rate": 2e-5,
+    "weight_decay": 0.0001,
+    "warmup_ratio": 0.05,
+    "gradient_accumulation_steps": 1,
+    "num_train_epochs": 1,
+    "per_device_train_batch_size": 32,
+    "per_device_eval_batch_size": 32,
+
+    "evaluation_strategy": "steps",
+    "eval_steps": 0.1,
+    "save_total_limit": 3,
+    "predict_with_generate": true,
+    "hub_strategy": "end",
+    "hub_private_repo": true,
+    "report_to": "wandb",
+    "logging_steps": 1,
+
+    "push_to_hub": true,
+    "token": "",
+    "hub_token": "",
+    "per_gpu_train_batch_size": null,
+    "per_gpu_eval_batch_size": null
+  }