数据集:
bigbio/gad
A corpus identifying associations between genes and diseases by a semi-automatic annotation procedure based on the Genetic Association Database.
The homepage for this dataset is no longer reachable, but its URL is recorded here. The data was originally downloaded from a Google Drive folder (the link used in the BLURB benchmark data download script). However, we host the data on the Hugging Face Hub for more reliable downloads and access.
@article{Bravo2015,
  author    = {Bravo, {\`{A}}lex and Pi{\~{n}}ero, Janet and Queralt-Rosinach, N{\'{u}}ria and Rautschka, Michael and Furlong, Laura I},
  title     = {Extraction of relations between genes and diseases from text and large-scale data analysis: implications for translational research},
  journal   = {{BMC} Bioinformatics},
  publisher = {Springer Science and Business Media {LLC}},
  volume    = {16},
  number    = {1},
  year      = {2015},
  month     = feb,
  doi       = {10.1186/s12859-015-0472-9},
  url       = {https://doi.org/10.1186/s12859-015-0472-9},
}