Spaces:

sakaltcommunity
/

Pythiajapneser

Sleeping

Sakalti committed on Oct 10, 2024

Commit

2661f41

verified ·

1 Parent(s): 1cd0800

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -12,12 +12,12 @@ def train_and_deploy(write_token, repo_name, license_text):
         f.write(license_text)
     # モデルとトークナイザーの読み込み
-    model_name = "HuggingfaceH4/zephyr-7b-beta"  # トレーニング対象のモデル
     model = AutoModelForCausalLM.from_pretrained(model_name)
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     # 日本語データセットの読み込み
-    dataset = load_dataset("Sakalti/hachiwari")
     # データセットのトークン化
     def tokenize_function(examples):

         f.write(license_text)
     # モデルとトークナイザーの読み込み
+    model_name = "Sakalti/iturkaAI-large"  # トレーニング対象のモデル
     model = AutoModelForCausalLM.from_pretrained(model_name)
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     # 日本語データセットの読み込み
+    dataset = load_dataset("range3/cc100-ja")
     # データセットのトークン化
     def tokenize_function(examples):