@@ -597,18 +597,26 @@ def validate_args(args):
597
597
parser .add_argument (
598
598
"--prefix-len" ,
599
599
type = int ,
600
- default = 0 ,
601
- help = "Number of fixed prefix tokens before the random "
602
- "context in a request (default: 0)." ,
603
- )
600
+ default = None ,
601
+ help = f"Number of prefix tokens to be used in RandomDataset "
602
+ "and SonnetDataset. For RandomDataset, the total input "
603
+ "length is the sum of prefix-len (default: "
604
+ f"{ RandomDataset .DEFAULT_PREFIX_LEN } ) and a random context length "
605
+ "sampled from [input_len * (1 - range_ratio), "
606
+ "input_len * (1 + range_ratio)]. For SonnetDataset, "
607
+ f"prefix_len (default: { SonnetDataset .DEFAULT_PREFIX_LEN } ) "
608
+ "controls how much of the input is fixed lines versus "
609
+ "random lines, but the total input length remains approximately "
610
+ "input_len tokens." )
604
611
# random dataset
605
612
parser .add_argument (
606
613
"--random-range-ratio" ,
607
614
type = float ,
608
- default = 0.0 ,
609
- help = "Range ratio for sampling input/output length, "
610
- "used only for RandomDataset. Must be in the range [0, 1) to define "
611
- "a symmetric sampling range "
615
+ default = None ,
616
+ help = f"Range ratio (default : { RandomDataset .DEFAULT_RANGE_RATIO } ) "
617
+ "for sampling input/output length, "
618
+ "used only for RandomDataset. Must be in the range [0, 1) to "
619
+ "define a symmetric sampling range "
612
620
"[length * (1 - range_ratio), length * (1 + range_ratio)]." ,
613
621
)
614
622
0 commit comments