smhavens committed on
Commit
7bf917c
·
1 Parent(s): 7faffe5

Bug found: train_data is indexed inside the for loop, so it must hold the entire train split (every column), not just the 'text' column

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -52,7 +52,7 @@ def training():
52
  # small_eval_dataset = tokenized_datasets["test"].shuffle(seed=42).select(range(1000))
53
 
54
  train_examples = []
55
- train_data = dataset['train']['text']
56
  # For agility we only 1/2 of our available data
57
  n_examples = dataset['train'].num_rows // 2
58
 
@@ -60,7 +60,7 @@ def training():
60
 
61
  for i in range(n_examples):
62
  example = train_data[i]
63
- print(example)
64
  train_examples.append(InputExample(texts=[example['id'], example['text']]))
65
 
66
  # train_dataloader = DataLoader(train_examples, shuffle=True, batch_size=16)
 
52
  # small_eval_dataset = tokenized_datasets["test"].shuffle(seed=42).select(range(1000))
53
 
54
  train_examples = []
55
+ train_data = dataset['train']
56
  # For agility we only 1/2 of our available data
57
  n_examples = dataset['train'].num_rows // 2
58
 
 
60
 
61
  for i in range(n_examples):
62
  example = train_data[i]
63
+ # print(example)
64
  train_examples.append(InputExample(texts=[example['id'], example['text']]))
65
 
66
  # train_dataloader = DataLoader(train_examples, shuffle=True, batch_size=16)