Kai Wu 1 年之前
父节点
当前提交
ca74a840f9
共有 1 个文件被更改，包括 1 次插入和 1 次删除
  1. 1 1
      recipes/finetuning/datasets/raft_dataset.py

+ 1 - 1
recipes/finetuning/datasets/raft_dataset.py

@@ -88,7 +88,7 @@ def raft_tokenize(q_a_pair, tokenizer):
     return tokenize_dialog(chat, tokenizer)
 
 
-def get_custom_dataset(dataset_config, tokenizer, split, split_ratio=0.8):
+def get_custom_dataset(dataset_config, tokenizer, split, split_ratio=0.9):
     # load_dataset will return DatasetDict that contains all the data in the train set
     dataset_dict = load_dataset('json', data_files=dataset_config.data_path)
     dataset = dataset_dict['train']