% Dataset Groups Activity Stream
% ProtST
% The ProtST dataset is a collection of protein sequences and their
% corresponding biomedical text descriptions.
% BibTeX:
%
% Citation record for the ProtST dataset as published through the TIB
% data service (see the doi and url fields below).
%
% NOTE(review): the author entered as "Ma Chang" is parsed by BibTeX as
% given name "Ma", family name "Chang"; that parse is preserved here.
% Confirm the intended name order against the original publication.
% NOTE(review): the exporter placeholder institution "No Organization"
% was dropped because it carries no bibliographic information.
@dataset{Minghao_Xu_and_Zuobai_Zhang_and_Jiarui_Lu_and_Zhaocheng_Zhu_and_Yangtian_Zhang_and_Ma_Chang_and_Runcheng_Liu_and_Jian_Tang_2024,
  author    = {Xu, Minghao and Zhang, Zuobai and Lu, Jiarui and Zhu, Zhaocheng and Zhang, Yangtian and Chang, Ma and Liu, Runcheng and Tang, Jian},
  title     = {{ProtST}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/wqf3k9xu},
  url       = {https://service.tib.eu/ldmservice/dataset/protst},
  keywords  = {biomedical text, protein sequence, sequence analysis},
  abstract  = {The ProtST dataset is a collection of protein sequences and their corresponding biomedical text descriptions.},
}