You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
info="Lower values make the output more deterministic, higher values increase randomness.",
273
291
)
274
292
top_p=gr.Slider(
275
293
label="Top P (Nucleus Sampling)",
276
-
minimum=0.80,
294
+
minimum=0.70,
277
295
maximum=1.0,
278
296
value=0.95, # Default from inference.py
279
297
step=0.01,
@@ -282,16 +300,16 @@ def run_inference(
282
300
cfg_filter_top_k=gr.Slider(
283
301
label="CFG Filter Top K",
284
302
minimum=15,
285
-
maximum=50,
286
-
value=30,
303
+
maximum=100,
304
+
value=45,
287
305
step=1,
288
306
info="Top k filter for CFG guidance.",
289
307
)
290
308
speed_factor_slider=gr.Slider(
291
309
label="Speed Factor",
292
310
minimum=0.8,
293
311
maximum=1.0,
294
-
value=0.94,
312
+
value=1.0,
295
313
step=0.02,
296
314
info="Adjusts the speed of the generated audio (1.0 = original speed).",
297
315
)
@@ -311,6 +329,7 @@ def run_inference(
311
329
inputs=[
312
330
text_input,
313
331
audio_prompt_input,
332
+
transcription_input,
314
333
max_new_tokens,
315
334
cfg_scale,
316
335
temperature,
@@ -330,29 +349,38 @@ def run_inference(
330
349
None,
331
350
3072,
332
351
3.0,
333
-
1.3,
352
+
1.8,
334
353
0.95,
335
-
35,
336
-
0.94,
354
+
45,
355
+
1.0,
337
356
],
338
357
[
339
358
"[S1] Open weights text to dialogue model. \n[S2] You get full control over scripts and voices. \n[S1] I'm biased, but I think we clearly won. \n[S2] Hard to disagree. (laughs) \n[S1] Thanks for listening to this demo. \n[S2] Try it now on Git hub and Hugging Face. \n[S1] If you liked our model, please give us a star and share to your friends. \n[S2] This was Nari Labs.",
0 commit comments