Kai Wu 1 tahun lalu
induk
melakukan
ca74a840f9
1 mengubah file dengan 1 tambahan dan 1 penghapusan
  1. 1 1
      recipes/finetuning/datasets/raft_dataset.py

+ 1 - 1
recipes/finetuning/datasets/raft_dataset.py

@@ -88,7 +88,7 @@ def raft_tokenize(q_a_pair, tokenizer):
     return tokenize_dialog(chat, tokenizer)
 
 
-def get_custom_dataset(dataset_config, tokenizer, split, split_ratio=0.8):
+def get_custom_dataset(dataset_config, tokenizer, split, split_ratio=0.9):
     # load_dataset will return DatasetDict that contains all the data in the train set
     dataset_dict = load_dataset('json', data_files=dataset_config.data_path)
     dataset = dataset_dict['train']