Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
import gensim.downloader as api | |
model = api.load("glove-twitter-200") | |
print("Model loaded.") | |
print("new-york" in model.key_to_index) # β True if token is present | |
print("new" in model.key_to_index) # β Also true | |
print("new york" in model.key_to_index) # β False β space not valid | |
# Optional: print 5 most similar to test | |
if "new-york" in model.key_to_index: | |
print(model.most_similar("new-york")) | |
compound_terms = [key for key in model.key_to_index if "-" in key] | |
print(f"Sample compound tokens: {compound_terms[:10]}") | |
model.save("../models/cbow_model.kv") | |