mtasic85 committed on
Commit
ad7223b
·
1 Parent(s): 9c11de1

cpt core 4

Browse files
Files changed (1) hide show
  1. scripts/cpt_core_model_4.py +4 -0
scripts/cpt_core_model_4.py CHANGED
@@ -4,6 +4,7 @@ from unsloth import FastLanguageModel
4
  import torch
5
  from transformers import AutoTokenizer
6
 
 
7
  os.environ['WANDB_PROJECT'] = 'tangled-alpha-0.9-core'
8
  run_name = 'cpt-core-4'
9
 
@@ -15,6 +16,7 @@ load_in_4bit = False
15
  model_name = '../out/pretrain-core-3/hf'
16
  output_dir = '../out/cpt-core-4'
17
 
 
18
  #
19
  # model
20
  #
@@ -53,6 +55,7 @@ model = FastLanguageModel.get_peft_model(
53
  )
54
  # print(f'{model=}')
55
 
 
56
  #
57
  # dataset
58
  #
@@ -76,6 +79,7 @@ def unlsoth_generator():
76
  train_dataset = Dataset.from_generator(unlsoth_generator)
77
  dataset = train_dataset.train_test_split(test_size=0.01)
78
 
 
79
  #
80
  # trainer
81
  #
 
4
  import torch
5
  from transformers import AutoTokenizer
6
 
7
+
8
  os.environ['WANDB_PROJECT'] = 'tangled-alpha-0.9-core'
9
  run_name = 'cpt-core-4'
10
 
 
16
  model_name = '../out/pretrain-core-3/hf'
17
  output_dir = '../out/cpt-core-4'
18
 
19
+
20
  #
21
  # model
22
  #
 
55
  )
56
  # print(f'{model=}')
57
 
58
+
59
  #
60
  # dataset
61
  #
 
79
  train_dataset = Dataset.from_generator(unlsoth_generator)
80
  dataset = train_dataset.train_test_split(test_size=0.01)
81
 
82
+
83
  #
84
  # trainer
85
  #