File tree Expand file tree Collapse file tree 2 files changed +4
-4
lines changed
Expand file tree Collapse file tree 2 files changed +4
-4
lines changed Original file line number Diff line number Diff line change 11# Dataset and Dataloader
2- dataset : slimorca
3- seed : 10
2+ dataset : alpaca
3+ seed : null
44shuffle : True
55
66# Model Arguments
Original file line number Diff line number Diff line change @@ -36,7 +36,7 @@ class SlimOrcaDataset(Dataset):
3636
3737 Keyword Arguments:
3838 max_token_length (int): Maximum number of tokens in the returned sample.
39- Default is 4096 .
39+ Default is 1024 .
4040
4141 Data input format:
4242 [ { "from": "system", "value": "You are an AI assistant. You will be
@@ -63,7 +63,7 @@ class SlimOrcaDataset(Dataset):
6363 def __init__ (self , tokenizer : Tokenizer , ** kwargs ) -> None :
6464 self ._data = load_dataset ("Open-Orca/SlimOrca-Dedup" , split = "train" )
6565 self ._tokenizer = tokenizer
66- self ._max_token_length = kwargs .get ("max_token_length" , 4096 )
66+ self ._max_token_length = kwargs .get ("max_token_length" , 1024 )
6767 if self ._max_token_length < 4 :
6868 # The input sequence needs at least 4 tokens: 1 bos, 1 eos,
6969 # 1 token from the prompt, and 1 from the label
You can’t perform that action at this time.
0 commit comments