Kai Wu 1 gadu atpakaļ
vecāks
revīzija
ca74a840f9
1 mainītis faili ar 1 papildinājumiem un 1 dzēšanām
  1. 1 1
      recipes/finetuning/datasets/raft_dataset.py

+ 1 - 1
recipes/finetuning/datasets/raft_dataset.py

@@ -88,7 +88,7 @@ def raft_tokenize(q_a_pair, tokenizer):
     return tokenize_dialog(chat, tokenizer)
     return tokenize_dialog(chat, tokenizer)
 
 
 
 
-def get_custom_dataset(dataset_config, tokenizer, split, split_ratio=0.8):
+def get_custom_dataset(dataset_config, tokenizer, split, split_ratio=0.9):
     # load_dataset will return DatasetDict that contains all the data in the train set
     # load_dataset will return DatasetDict that contains all the data in the train set
     dataset_dict = load_dataset('json', data_files=dataset_config.data_path)
     dataset_dict = load_dataset('json', data_files=dataset_config.data_path)
     dataset = dataset_dict['train']
     dataset = dataset_dict['train']