@@ -172,10 +172,10 @@ class DataTrainingArguments:
172172 """
173173
174174 dataset_name : Optional [str ] = field (
175- default = "ought /raft" , metadata = {"help" : "The name of the dataset to use (via the datasets library)." }
175+ default = "regisss /raft" , metadata = {"help" : "The name of the dataset to use (via the datasets library)." }
176176 )
177177 dataset_config_name : Optional [str ] = field (
178- default = "twitter_complaints " ,
178+ default = "default " ,
179179 metadata = {"help" : "The configuration name of the dataset to use (via the datasets library)." },
180180 )
181181 max_eval_samples : Optional [int ] = field (
@@ -250,11 +250,11 @@ def main():
250250 streaming = data_args .streaming ,
251251 trust_remote_code = model_args .trust_remote_code ,
252252 )
253- if data_args .dataset_name == "ought /raft" and data_args .dataset_config_name == "twitter_complaints " :
254- text_column = "Tweet text "
253+ if data_args .dataset_name == "regisss /raft" and data_args .dataset_config_name == "default " :
254+ text_column = "Abstract Note "
255255 label_column = "text_label"
256256 else :
257- raise ValueError ("preprocess is only for ought /raft twitter_complaints now" )
257+ raise ValueError ("preprocess is only for regisss /raft default now" )
258258 classes = [k .replace ("_" , " " ) for k in dataset ["train" ].features ["Label" ].names ]
259259 dataset = dataset .map (
260260 lambda x : {"text_label" : [classes [label ] for label in x ["Label" ]]},
0 commit comments