Dataset Groups Activity Stream
Harvard USPTO Patent Dataset
The Harvard USPTO Dataset is a large-scale, well-structured, and multi-purpose corpus of patent applications.
BibTeX:

% Citation record for the "Harvard USPTO Patent Dataset" as published by TIB.
% Everything outside the entry below (including these lines) is ignored by
% BibTeX/Biber and serves only as human-readable context.
%
% The citation key is kept exactly as exported so existing citations keep
% resolving. It contains non-ASCII characters, as do the author names, so
% the file must be processed as UTF-8 (biblatex + Biber).
%
% NOTE(review): institution = {No Organization} looks like an exporter
% placeholder rather than a real affiliation -- confirm before relying on it.

@dataset{You_Zuo_and_Kim_Gerdes_and_Éric_de_la_Clergerie_and_Benoît_Sagot_2024,
  author      = {Zuo, You and Gerdes, Kim and de la Clergerie, Éric and Sagot, Benoît},
  title       = {{Harvard} {USPTO} Patent Dataset},
  year        = {2024},
  month       = dec,
  publisher   = {TIB},
  institution = {No Organization},
  doi         = {10.57702/ld0ofixt},
  url         = {https://service.tib.eu/ldmservice/dataset/harvard-uspto-patent-dataset},
  keywords    = {USPTO, natural language processing, patent applications},
  abstract    = {The Harvard USPTO Dataset is a large-scale, well-structured, and multi-purpose corpus of patent applications.},
}