danhtran2mind
/

Qwen-3-0.6B-Instruct-Vi-Medical-LoRA

@@ -179,8 +179,8 @@
     "import os\n",
     "api = HfApi()\n",
     "\n",
-    "repo_id = \"heboya8/Qwen-3-0.6B-it-Medical-LoRA\"\n",
-    "save_path = \"Qwen-3-0.6B-it-Medical-LoRA\"\n",
     "\n",
     "# Create the directory if it doesn't exist\n",
     "os.makedirs(save_path, exist_ok=True)\n",
@@ -519,7 +519,7 @@
    "outputs": [],
    "source": [
     "arguments = TrainingArguments(  \n",
-    "                resume_from_checkpoint=\"./Qwen-3-0.6B-it-Medical-LoRA\",\n",
     "                per_device_train_batch_size=8,  \n",
     "                per_device_eval_batch_size=8,  \n",
     "                gradient_accumulation_steps=4,  \n",
@@ -540,7 +540,7 @@
     "                weight_decay=0.01,  \n",
     "                lr_scheduler_type=\"linear\",  \n",
     "                seed=42,  \n",
-    "                output_dir=\"Qwen-3-0.6B-it-Medical-LoRA\",  \n",
     "                report_to=\"none\",\n",
     "                load_best_model_at_end=True,  # Load weights with lowest val loss\n",
     "        \t\tgreater_is_better=False,\n",
@@ -622,7 +622,7 @@
     }
    ],
    "source": [
-    "!ls -a Qwen-3-0.6B-it-Medical-LoRA"
    ]
   },
   {
@@ -838,8 +838,8 @@
    },
    "outputs": [],
    "source": [
-    "model.save_pretrained(\"./Qwen-3-0.6B-it-Medical-LoRA\")  # Local saving\n",
-    "tokenizer.save_pretrained(\"./Qwen-3-0.6B-it-Medical-LoRA\")"
    ]
   },
   {

     "import os\n",
     "api = HfApi()\n",
     "\n",
+    "repo_id = \"danhtran2mind/Qwen-3-0.6B-Instruct-Vi-Medical-LoRA\"\n",
+    "save_path = \"Qwen-3-0.6B-Instruct-Vi-Medical-LoRA\"\n",
     "\n",
     "# Create the directory if it doesn't exist\n",
     "os.makedirs(save_path, exist_ok=True)\n",
    "outputs": [],
    "source": [
     "arguments = TrainingArguments(  \n",
+    "                resume_from_checkpoint=\"./Qwen-3-0.6B-Instruct-Vi-Medical-LoRA\",\n",
     "                per_device_train_batch_size=8,  \n",
     "                per_device_eval_batch_size=8,  \n",
     "                gradient_accumulation_steps=4,  \n",
     "                weight_decay=0.01,  \n",
     "                lr_scheduler_type=\"linear\",  \n",
     "                seed=42,  \n",
+    "                output_dir=\"Qwen-3-0.6B-Instruct-Vi-Medical-LoRA\",  \n",
     "                report_to=\"none\",\n",
     "                load_best_model_at_end=True,  # Load weights with lowest val loss\n",
     "        \t\tgreater_is_better=False,\n",
     }
    ],
    "source": [
+    "!ls -a Qwen-3-0.6B-Instruct-Vi-Medical-LoRA"
    ]
   },
   {
    },
    "outputs": [],
    "source": [
+    "model.save_pretrained(\"./Qwen-3-0.6B-Instruct-Vi-Medical-LoRA\")  # Local saving\n",
+    "tokenizer.save_pretrained(\"./Qwen-3-0.6B-Instruct-Vi-Medical-LoRA\")"
    ]
   },
   {