Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -14,20 +14,20 @@ def load_tokenizer(tokenizer_choice):
|
|
14 |
"aranizer_sp64k": aranizer_sp64k.get_tokenizer(),
|
15 |
"aranizer_sp86k": aranizer_sp86k.get_tokenizer(),
|
16 |
}
|
17 |
-
|
18 |
return tokenizer_map.get(tokenizer_choice, None)
|
19 |
|
20 |
def tokenize_and_encode_and_embed(text, tokenizer_choice):
|
21 |
-
tokenizer =
|
22 |
if tokenizer:
|
23 |
# Example methods. Replace with actual methods from your tokenizer
|
24 |
tokens = tokenizer.tokenize(text)
|
25 |
encoded_output = tokenizer.encode(text, add_special_tokens=True)
|
26 |
decoded_text = tokenizer.decode(encoded_output)
|
27 |
-
|
28 |
# Example embedding (replace with actual embedding generation from your model)
|
29 |
embeddings = [random() for _ in range(10)] # Example 10-dimensional embedding vector
|
30 |
-
|
31 |
return " ".join(tokens), str(encoded_output), decoded_text, embeddings
|
32 |
else:
|
33 |
return "Tokenizer not loaded correctly", "", "", []
|
@@ -48,4 +48,4 @@ demo = gr.Interface(
|
|
48 |
description="حدد نوع المحلل اللفظي وأدخل نصًا لرؤية النتائج ومتجه التضمين.",
|
49 |
)
|
50 |
|
51 |
-
demo.launch()
|
|
|
14 |
"aranizer_sp64k": aranizer_sp64k.get_tokenizer(),
|
15 |
"aranizer_sp86k": aranizer_sp86k.get_tokenizer(),
|
16 |
}
|
17 |
+
|
18 |
return tokenizer_map.get(tokenizer_choice, None)
|
19 |
|
20 |
def tokenize_and_encode_and_embed(text, tokenizer_choice):
    """Tokenize, encode and decode ``text`` and attach a placeholder embedding.

    Args:
        text: Input string handed to the tokenizer.
        tokenizer_choice: Key passed to ``load_tokenizer`` to pick a tokenizer.

    Returns:
        A 4-tuple ``(tokens, encoded, decoded, embeddings)``:
        the tokens joined with single spaces, ``str()`` of the encoded
        output, the text decoded back from that encoding, and a list of 10
        values produced by ``random()``.
        If no tokenizer is available for ``tokenizer_choice`` the tuple is
        ``("Tokenizer not loaded correctly", "", "", [])``.
    """
    tokenizer = load_tokenizer(tokenizer_choice)

    # Compare against None explicitly: a tokenizer object may define
    # __len__/__bool__, so plain truthiness is not a reliable "was it
    # loaded" signal.
    if tokenizer is None:
        return "Tokenizer not loaded correctly", "", "", []

    # Example methods. Replace with actual methods from your tokenizer
    tokens = tokenizer.tokenize(text)
    encoded_output = tokenizer.encode(text, add_special_tokens=True)
    decoded_text = tokenizer.decode(encoded_output)

    # Example embedding (replace with actual embedding generation from your
    # model). NOTE(review): assumes ``random`` is bound at module level,
    # e.g. ``from random import random`` -- confirm in the file's imports.
    embeddings = [random() for _ in range(10)]

    return " ".join(tokens), str(encoded_output), decoded_text, embeddings
|
|
|
48 |
description="حدد نوع المحلل اللفظي وأدخل نصًا لرؤية النتائج ومتجه التضمين.",
|
49 |
)
|
50 |
|
51 |
+
demo.launch()
|