Fix keyword argument invocation

This commit is contained in:
Chime Ogbuji 2024-11-03 20:26:15 -05:00
parent 04cf93df55
commit e477060a00

View File

@@ -194,10 +194,20 @@ def load_custom_hf_dataset(args, tokenizer: PreTrainedTokenizer):
valid_split = hf_args.get("valid_split", "train[-10%:]") valid_split = hf_args.get("valid_split", "train[-10%:]")
text_f, prompt_f, completion_f, chat_f = get_hf_custom_features(hf_args) text_f, prompt_f, completion_f, chat_f = get_hf_custom_features(hf_args)
train = create_hf_dataset( train = create_hf_dataset(
ds_name, text_f, prompt_f, completion_f, chat_f, split=train_split dataset_name=ds_name,
text_feature=text_f,
prompt_feature=prompt_f,
completion_feature=completion_f,
chat_feature=chat_f,
split=train_split,
) )
valid = create_hf_dataset( valid = create_hf_dataset(
ds_name, text_f, prompt_f, completion_f, chat_f, split=valid_split dataset_name=ds_name,
text_feature=text_f,
prompt_feature=prompt_f,
completion_feature=completion_f,
chat_feature=chat_f,
split=valid_split,
) )
return train, valid return train, valid
@@ -219,11 +229,11 @@ def load_custom_hf_dataset(args, tokenizer: PreTrainedTokenizer):
train, valid = [], [] train, valid = [], []
if args.test: if args.test:
test = create_hf_dataset( test = create_hf_dataset(
dataset_name, dataset_name=dataset_name,
text_feature, text_feature=text_feature,
prompt_feature, prompt_feature=prompt_feature,
completion_feature, completion_feature=completion_feature,
chat_f, chat_feature=chat_f,
split=hf_args.get("test_split"), split=hf_args.get("test_split"),
) )
else: else: