Skip to content

Commit a18b41e

Browse files
committed
chore: training args init
1 parent 47ca822 commit a18b41e

File tree

1 file changed

+7
-7
lines changed

1 file changed

+7
-7
lines changed

train.ipynb

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -119,7 +119,7 @@
119119
"DATASETS_REPO_ID = \"ryanlinjui/menu-zh-TW\" # set your dataset repo id for training\n",
120120
"PRETRAINED_MODEL_REPO_ID = \"naver-clova-ix/donut-base\" # set your pretrained model repo id for fine-tuning\n",
121121
"TASK_PROMPT_NAME = \"<s_menu-text-detection>\" # set your task prompt name for training\n",
122-
"MAX_LENGTH = 1024 # set your max length for maximum output length, max to 1536 for donut-base\n",
122+
"MAX_LENGTH = 768 # set your max length for maximum output length, max to 1536 for donut-base\n",
123123
"IMAGE_SIZE = [1280, 960] # set your image size for training\n",
124124
"\n",
125125
"register_heif_opener()\n",
@@ -185,7 +185,7 @@
185185
"\n",
186186
"HUGGINGFACE_MODEL_ID = \"ryanlinjui/donut-base-finetuned-menu\" # set your huggingface model repo id for saving / pushing to the hub\n",
187187
"EPOCHS = 100 # set your training epochs\n",
188-
"TRAIN_BATCH_SIZE = 1 # set your training batch size\n",
188+
"TRAIN_BATCH_SIZE = 8 # set your training batch size\n",
189189
"LEARNING_RATE = 3e-5 # set your learning rate\n",
190190
"WEIGHT_DECAY = 0.1 # set your weight decay\n",
191191
"\n",
@@ -231,17 +231,17 @@
231231
" per_device_eval_batch_size=1,\n",
232232
" output_dir=\"./.checkpoints\",\n",
233233
" seed=42,\n",
234-
" warmup_steps=30,\n",
234+
" warmup_steps=300,\n",
235235
" eval_strategy=\"steps\",\n",
236-
" eval_steps=200,\n",
236+
" eval_steps=1000,\n",
237237
" fp16=(device == \"cuda\"),\n",
238238
" predict_with_generate=True,\n",
239239
" generation_max_length=MAX_LENGTH,\n",
240240
" generation_num_beams=1,\n",
241241
" logging_strategy=\"steps\",\n",
242242
" logging_steps=50,\n",
243243
" save_strategy=\"steps\",\n",
244-
" save_steps=200,\n",
244+
" save_steps=1000,\n",
245245
" push_to_hub=True if HUGGINGFACE_MODEL_ID else False,\n",
246246
" hub_model_id=HUGGINGFACE_MODEL_ID,\n",
247247
" hub_strategy=\"every_save\",\n",
@@ -272,7 +272,7 @@
272272
"\n",
273273
"MODEL_REPO_ID = \"ryanlinjui/donut-base-finetuned-menu\"\n",
274274
"TASK_PROMPT_NAME = \"<s_menu-text-detection>\"\n",
275-
"MAX_LENGTH = 1024\n",
275+
"MAX_LENGTH = 768\n",
276276
"IMAGE_SIZE = [1280, 960]\n",
277277
"\n",
278278
"processor = DonutProcessor.from_pretrained(MODEL_REPO_ID)\n",
@@ -306,7 +306,7 @@
306306
],
307307
"metadata": {
308308
"kernelspec": {
309-
"display_name": ".venv",
309+
"display_name": "menu-text-detection",
310310
"language": "python",
311311
"name": "python3"
312312
},

0 commit comments

Comments
 (0)