Spaces:

CosmoAI
/

BhagwatGeeta

Runtime error

CosmoAI committed on Mar 22, 2024

Commit

42cf287

verified ·

1 Parent(s): 64d575d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -151,8 +151,10 @@ def prepare_training_data(qa_pairs, tokenizer):
     # Here, we assume the context is a single long string.
     context = "your_bhagavad_gita_text_here"  # Replace with your preprocessed Bhagavad Gita text
     context_encoded = tokenizer(context, add_special_tokens=True, return_tensors="pt")
-    start_positions = answer_encoded.input_ids == tokenizer.convert_tokens_to_ids(tokenizer.sep_token)[0]  # Find first SEP token
-    end_positions = answer_encoded.input_ids == tokenizer.convert_tokens_to_ids(tokenizer.eos_token)[0]  # Find first EOS token
     # Combine all data into a dictionary for each QA pair
     encoded_data.append({

     # Here, we assume the context is a single long string.
     context = "your_bhagavad_gita_text_here"  # Replace with your preprocessed Bhagavad Gita text
     context_encoded = tokenizer(context, add_special_tokens=True, return_tensors="pt")
+    # start_positions = answer_encoded.input_ids == tokenizer.convert_tokens_to_ids(tokenizer.sep_token)[0]  # Find first SEP token
+      start_positions = answer_encoded.input_ids == [tokenizer.convert_tokens_to_ids(tokenizer.sep_token)[0]]
+    end_positions = answer_encoded.input_ids == [tokenizer.convert_tokens_to_ids(tokenizer.eos_token)[0]]  # Find first EOS token
     # Combine all data into a dictionary for each QA pair
     encoded_data.append({