         # {resp}
         delim="\n\n",
     ),
+    "llama3-math": dict(  # https://llama.meta.com/docs/model-cards-and-prompt-formats/meta-llama-3
+        id="llama3-math",
+        sys_prompt=(
+            "<|begin_of_text|>"
+            # + "<|start_header_id|>system<|end_header_id|>\n\n"
+            # + "You are a helpful assistant."
+            # + "<|eot_id|>"
+        ),
+        query_prompt="<|start_header_id|>" + "user" + "<|end_header_id|>" + "\n\n",
+        # {query}
+        prompt_after_query="<|eot_id|>",
+        resp_prompt="<|start_header_id|>" + "assistant" + "<|end_header_id|>" + "\n\n",
+        prompt_before_resp="",
+        # {resp}
+        delim="<|eot_id|>" + "\n",
+        model_ids=[
+            "meta-llama--Meta-Llama-3-8B-Instruct",
+            "meta-llama--Meta-Llama-3-70B-Instruct",
+            "meta-llama--Meta-Llama-3.1-8B-Instruct",
+            "meta-llama--Meta-Llama-3.1-70B-Instruct",
+        ],
+    ),
 }
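For orientation, a minimal sketch (not part of the commit) of the zero-shot prompt string the new "llama3-math" template should render, assuming the fields are concatenated in the order sys_prompt, query_prompt, {query}, prompt_after_query, resp_prompt, prompt_before_resp:

# Hedged sketch: builds the expected Llama 3 chat-format prompt by hand.
# The literals mirror the dict above; the assembly order is an assumption.
query = "What is 1 + 1?"
expected_prompt = (
    "<|begin_of_text|>"                                          # sys_prompt
    + "<|start_header_id|>user<|end_header_id|>" + "\n\n"        # query_prompt
    + query
    + "<|eot_id|>"                                               # prompt_after_query
    + "<|start_header_id|>assistant<|end_header_id|>" + "\n\n"   # resp_prompt
    + ""                                                         # prompt_before_resp
)
print(expected_prompt)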
@@ -184,7 +206,13 @@ def __init__(
     def load_from_id_or_path(prompt_template: str = "alpaca") -> "PromptTemplate":
         """Load prompt template from ID or file path."""
         if prompt_template in PROMPT_TEMPLATE_ID2DICT:  # ID
-            return PromptTemplate(**PROMPT_TEMPLATE_ID2DICT[prompt_template])
+            return PromptTemplate(
+                **{
+                    k: v
+                    for k, v in PROMPT_TEMPLATE_ID2DICT[prompt_template].items()
+                    if k != "model_ids"
+                }
+            )
         elif isinstance(prompt_template, str) and os.path.exists(prompt_template):
             # File path
             stem = os.path.splitext(os.path.basename(prompt_template))[0]
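The new dict comprehension presumably drops the "model_ids" key because the PromptTemplate constructor has no such parameter; the key only exists to drive the model dispatch further down. A self-contained sketch of that filtering, using a made-up template dict:

# Hedged sketch with a hypothetical template dict; only the filtering idiom
# matches the diff, the values are illustrative.
template_dict = {
    "id": "llama3-math",
    "sys_prompt": "<|begin_of_text|>",
    "model_ids": ["meta-llama--Meta-Llama-3-8B-Instruct"],
}
ctor_kwargs = {k: v for k, v in template_dict.items() if k != "model_ids"}
assert "model_ids" not in ctor_kwargs  # safe to unpack as **kwargs into the constructor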
@@ -216,15 +244,15 @@ def make_full_prompt(self, query: str, eg_qas: list[tuple[str, str]] = []) -> st
     @staticmethod
     def get_prompt_template_from_prompt_type_and_model(
         prompt_type: str,
-        model_name_or_path: str,
+        model_dirname: str,
     ) -> "PromptTemplate":
         """Get the prompt template suitable for the model.

         Parameters
         ----------
         prompt_type : str
             Prompt type, like "cot" or "tool".
-        model_name_or_path : str
+        model_dirname : str
             HF ID or path to the model.

         Returns
@@ -234,29 +262,31 @@ def get_prompt_template_from_prompt_type_and_model(
         """
         prompt_template = None
         if prompt_type == "cot":
-            if model_name_or_path in BASE_MODEL_IDS + MATH_SHEPHERD_MODEL_IDS:
+            if model_dirname in BASE_MODEL_IDS + MATH_SHEPHERD_MODEL_IDS:
                 prompt_template = "qa"
-            elif model_name_or_path.startswith("dart-math"):
+            elif model_dirname.startswith("dart-math"):
                 prompt_template = "alpaca"
-            elif model_name_or_path in DEEPSEEK_INSTR_MODEL_IDS:
+            elif model_dirname in DEEPSEEK_INSTR_MODEL_IDS:
                 prompt_template = "deepseekmath"
-            elif model_name_or_path.startswith("Xwin-LM/Xwin-Math"):
+            elif model_dirname.startswith("Xwin-LM/Xwin-Math"):
                 prompt_template = "xwinmath"
-            elif model_name_or_path.startswith("TIGER-Lab--MAmmoTH2"):
+            elif model_dirname.startswith("TIGER-Lab--MAmmoTH2"):
                 prompt_template = "mammoth2-cot"
+            elif model_dirname in PROMPT_TEMPLATE_ID2DICT["llama3-math"]["model_ids"]:
+                prompt_template = "llama3-math"
             else:  # default
                 prompt_template = "alpaca"
         elif prompt_type == "tool":
-            if model_name_or_path in DEEPSEEK_INSTR_MODEL_IDS:
+            if model_dirname in DEEPSEEK_INSTR_MODEL_IDS:
                 prompt_template = "deepseekmath-tool"

         if prompt_template is None:
             raise ValueError(
-                f"Unknown prompt type {prompt_type} for model {model_name_or_path}."
+                f"Unknown prompt type {prompt_type} for model {model_dirname}."
             )

         prompt_template = PromptTemplate.load_from_id_or_path(prompt_template)
-        if "MMIQC" in model_name_or_path:
+        if "MMIQC" in model_dirname:
             prompt_template.prompt_before_resp = (
                 'Please solve the following problem and put your answer at the end with "The answer is: ".'
                 + " "