数据集:
cfilt/iwn_wordlists
We provide the unique word list from the IndoWordNet (IWN) knowledge base.
# Example: load the IndoWordNet unique word list for a single language.
from datasets import load_dataset

# Supported languages: assamese, bengali, bodo, gujarati, hindi, kannada,
# kashmiri, konkani, malayalam, manipuri, marathi, meitei, nepali, oriya,
# punjabi, sanskrit, tamil, telugu, urdu.
language = "hindi"

# The language name is passed as the second argument to select that
# language's word list.
words = load_dataset("cfilt/iwn_wordlists", language)

# The words are read from the "word" column of the "train" split.
word_list = words["train"]["word"]
@inproceedings{bhattacharyya2010indowordnet, title={IndoWordNet}, author={Bhattacharyya, Pushpak}, booktitle={Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)}, year={2010} }