7474MODEL_ID = "nvidia/nemotron-3-nano-30b-a3b"
7575
7676# We choose this alias to be descriptive for our use case.
77- MODEL_ALIAS = "nemotron-nano-v2"
78-
79- # This sets reasoning to False for the nemotron-nano-v2 model.
80- SYSTEM_PROMPT = "/no_think"
77+ MODEL_ALIAS = "nemotron-nano-v3"
8178
8279model_configs = [
8380 ModelConfig (
8481 alias = MODEL_ALIAS ,
8582 model = MODEL_ID ,
8683 provider = MODEL_PROVIDER ,
8784 inference_parameters = ChatCompletionInferenceParams (
88- temperature = 0.5 ,
85+ temperature = 1.0 ,
8986 top_p = 1.0 ,
90- max_tokens = 1024 ,
87+ max_tokens = 2048 ,
88+ extra_body = {"chat_template_kwargs" : {"enable_thinking" : False }},
9189 ),
9290 )
9391]
@@ -286,7 +284,6 @@ class ProductReview(BaseModel):
286284 "related to '{{ product_subcategory }}'. The target age range of the ideal customer is "
287285 "{{ target_age_range }} years old. The product should be priced between $10 and $1000."
288286 ),
289- system_prompt = SYSTEM_PROMPT ,
290287 output_format = Product ,
291288 model_alias = MODEL_ALIAS ,
292289 )
@@ -304,12 +301,12 @@ class ProductReview(BaseModel):
304301 "Imagine your name is {{ customer_name }} and you are from {{ customer.city }}, {{ customer.state }}. "
305302 "Write the review in a style that is '{{ review_style }}'."
306303 "{% if target_age_range == '18-25' %}"
307- "Make sure the review is more informal and conversational."
304+ "Make sure the review is more informal and conversational.\n "
308305 "{% else %}"
309- "Make sure the review is more formal and structured."
306+ "Make sure the review is more formal and structured.\n "
310307 "{% endif %}"
308+ "The review field should contain only the review, no other text."
311309 ),
312- system_prompt = SYSTEM_PROMPT ,
313310 output_format = ProductReview ,
314311 model_alias = MODEL_ALIAS ,
315312 )
0 commit comments