@@ -22,7 +22,6 @@ def codegen(
2222 n_samples = 1 ,
2323 id_range = None ,
2424 resume = True ,
25- subsample_size = None ,
2625):
2726 with Progress (
2827 TextColumn (f"{ dataset } •" + "[progress.percentage]{task.percentage:>3.0f}%" ),
@@ -33,11 +32,7 @@ def codegen(
3332 ) as p :
3433 if dataset == "wildcodebench" :
3534 from wildcode .data import get_wildcodebench , write_jsonl
36-
3735 dataset = get_wildcodebench ()
38- if subsample_size :
39- if subsample_size < len (dataset ):
40- dataset = dataset [:subsample_size ]
4136
4237 if model .is_direct_completion () and nl2code :
4338 raise Exception ("Base model does not support direct completion for NL2Code tasks" )
@@ -112,7 +107,6 @@ def main():
112107 parser .add_argument ("--model" , required = True , type = str )
113108 parser .add_argument ("--dataset" , required = True , type = str )
114109 parser .add_argument ("--save_path" , default = None , type = str )
115- parser .add_argument ("--subsample_size" , default = None , type = int )
116110 parser .add_argument ("--nl2code" , action = 'store_true' )
117111 parser .add_argument ("--bs" , default = 1 , type = int )
118112 parser .add_argument ("--n_samples" , default = 1 , type = int )
@@ -173,7 +167,6 @@ def main():
173167 n_samples = args .n_samples ,
174168 resume = args .resume ,
175169 id_range = args .id_range ,
176- subsample_size = args .subsample_size ,
177170 )
178171
179172
0 commit comments