@@ -515,12 +515,12 @@ <h1>Source code for torchtune.datasets._concat</h1><div class="highlight"><pre>
515
515
< span class ="k "> def</ span > < span class ="w "> </ span > < span class ="fm "> __init__</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="p "> ,</ span > < span class ="n "> datasets</ span > < span class ="p "> :</ span > < span class ="n "> List</ span > < span class ="p "> [</ span > < span class ="n "> Dataset</ span > < span class ="p "> ]):</ span >
516
516
< span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> _datasets</ span > < span class ="p "> :</ span > < span class ="n "> List</ span > < span class ="p "> [</ span > < span class ="n "> Dataset</ span > < span class ="p "> ]</ span > < span class ="o "> =</ span > < span class ="n "> datasets</ span >
517
517
518
- < span class ="k " > for </ span > < span class ="n "> dataset</ span > < span class ="ow " > in </ span > < span class ="bp " > self </ span > < span class ="o " > . </ span > < span class ="n "> _datasets </ span > < span class ="p "> : </ span >
519
- < span class ="k "> if</ span > < span class ="nb "> isinstance </ span > < span class ="p "> (</ span > < span class ="n "> dataset </ span > < span class ="p "> , </ span > < span class ="n "> PackedDataset </ span > < span class ="p "> ):</ span >
520
- < span class ="k "> raise</ span > < span class ="ne "> ValueError</ span > < span class ="p "> (</ span >
521
- < span class ="s2 "> "ConcatDataset can't process instances of PackedDataset ."</ span >
522
- < span class ="p "> )</ span >
523
-
518
+ < span class ="n " > is_packed </ span > < span class ="o " > = </ span > < span class =" p " > [ </ span > < span class =" nb " > isinstance </ span > < span class =" p " > ( </ span > < span class =" n "> dataset</ span > < span class =" p " > , </ span > < span class ="n " > PackedDataset </ span > < span class =" p " > ) </ span > < span class ="k " > for </ span > < span class ="n " > dataset </ span > < span class ="ow " > in </ span > < span class =" n "> datasets </ span > < span class ="p "> ] </ span >
519
+ < span class ="k "> if</ span > < span class ="nb "> any </ span > < span class ="p "> (</ span > < span class ="n "> is_packed </ span > < span class ="p "> ) </ span > < span class ="ow " > and </ span > < span class =" ow " > not </ span > < span class =" nb " > all </ span > < span class =" p " > ( </ span > < span class =" n "> is_packed </ span > < span class ="p "> ):</ span >
520
+ < span class ="k "> raise</ span > < span class ="ne "> ValueError</ span > < span class ="p "> (</ span >
521
+ < span class ="s2 "> "ConcatDataset can't process a mix of packed and non-packed datasets ."</ span >
522
+ < span class ="p "> )</ span >
523
+ < span class =" bp " > self </ span > < span class =" o " > . </ span > < span class =" n " > packed </ span > < span class =" o " > = </ span > < span class =" nb " > all </ span > < span class =" p " > ( </ span > < span class =" n " > is_packed </ span > < span class =" p " > ) </ span >
524
524
< span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> _len</ span > < span class ="p "> :</ span > < span class ="nb "> int</ span > < span class ="o "> =</ span > < span class ="nb "> sum</ span > < span class ="p "> (</ span > < span class ="nb "> len</ span > < span class ="p "> (</ span > < span class ="n "> dataset</ span > < span class ="p "> )</ span > < span class ="k "> for</ span > < span class ="n "> dataset</ span > < span class ="ow "> in</ span > < span class ="n "> datasets</ span > < span class ="p "> )</ span >
525
525
< span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> _indexes</ span > < span class ="p "> :</ span > < span class ="n "> List</ span > < span class ="p "> [</ span > < span class ="n "> Tuple</ span > < span class ="p "> [</ span > < span class ="nb "> int</ span > < span class ="p "> ,</ span > < span class ="nb "> int</ span > < span class ="p "> ,</ span > < span class ="nb "> int</ span > < span class ="p "> ]]</ span > < span class ="o "> =</ span > < span class ="p "> []</ span >
526
526
0 commit comments