{"d0fefb948fda82ed6ffe4eea87281c7fdiglezakis":{"DOI":"10.1162/qss_a_00049","ISBN":"","ISSN":"2641-3337","URL":"https://doi.org/10.1162/qss_a_00049","abstract":"Many interesting use cases of research data classifiers presuppose that a research data item can be mapped to more than one field of study, but for such classification mechanisms, reproducible evaluations are lacking. This paper closes this gap: It describes the creation of a training and evaluation set comprised of labeled metadata, evaluates several supervised classification approaches, and comments on their application in scientometric research. The metadata were retrieved from the DataCite index of research data, pre-processed, and compiled into a set of 613,585 records. According to our experiments with 20 general fields of study, multi-layer perceptron models perform best, followed by long short-term memory models. The models can be used in scientometric research, for example to analyze interdisciplinary trends of digital scholarly output or to characterize growth patterns of research data, stratified by field of study. Our findings allow us to estimate errors in applying the models. 
The best performing models and the data used for their training are available for re-use.","annote":"","author":[{"family":"Weber","given":"Tobias"},{"family":"Kranzlmüller","given":"Dieter"},{"family":"Fromm","given":"Michael"},{"family":"de Sousa","given":"Nelson Tavares"}],"citation-label":"10.1162/qss_a_00049","collection-editor":[],"collection-title":"","container-author":[],"container-title":"Quantitative Science Studies","documents":[],"edition":"","editor":[],"event-date":{"date-parts":[["2020","06"]],"literal":"2020"},"event-place":"","id":"d0fefb948fda82ed6ffe4eea87281c7fdiglezakis","interhash":"2073dbed64ec28747366e3c59d7f72da","intrahash":"d0fefb948fda82ed6ffe4eea87281c7f","issue":"2","issued":{"date-parts":[["2020","06"]],"literal":"2020"},"keyword":"forschungsdaten artificialIntelligence subjectIndexing automated","misc":{"eprint":"https://direct.mit.edu/qss/article-pdf/1/2/525/1885831/qss_a_00049.pdf","issn":"2641-3337","doi":"10.1162/qss_a_00049"},"note":"","number":"2","number-of-pages":"25","page":"525-550","page-first":"525","publisher":"","publisher-place":"","status":"","title":"Using supervised learning to classify metadata of research data by field of study","type":"article-journal","username":"diglezakis","version":"","volume":"1"},"e8528813e07745135835c57183eabb11diglezakis":{"DOI":"","ISBN":"","ISSN":"1869-1137","URL":"http://hdl.handle.net/11108/627","abstract":"","annote":"","author":[{"family":"Kasprzik","given":"Anna"}],"citation-label":"kasprzik2024knstliche","collection-editor":[{"family":"(BIB)","given":"Berufsverband Information Bibliothek"}],"collection-title":"","container-author":[{"family":"(BIB)","given":"Berufsverband Information Bibliothek"}],"container-title":"BuB - Forum Bibliothek und Information","documents":[],"edition":"","editor":[{"family":"(BIB)","given":"Berufsverband Information 
Bibliothek"}],"event-date":{"date-parts":[["2024"]],"literal":"2024"},"event-place":"","id":"e8528813e07745135835c57183eabb11diglezakis","interhash":"fe364d013e08b0e40096b5d479b21a41","intrahash":"e8528813e07745135835c57183eabb11","issue":"08-09","issued":{"date-parts":[["2024"]],"literal":"2024"},"keyword":"artificialIntelligence subjectIndexing automated da-fdm","misc":{"issn":"1869-1137"},"note":"","number":"08-09","number-of-pages":"3","page":"442-445","page-first":"442","publisher":"","publisher-place":"","status":"","title":"Künstliche Intelligenz für die Inhaltserschließung – ein Statusupdate","type":"article-journal","username":"diglezakis","version":"","volume":"76"},"993ffe08eb3813d0a25b30b88a2d8b0fdiglezakis":{"DOI":"","ISBN":"","ISSN":"","URL":"https://arxiv.org/abs/2405.11706","abstract":"","annote":"","author":[{"family":"Allemang","given":"Dean"},{"family":"Sequeda","given":"Juan"}],"citation-label":"allemang2024increasingllmaccuracyquestion","collection-editor":[],"collection-title":"","container-author":[],"container-title":"","documents":[],"edition":"","editor":[],"event-date":{"date-parts":[["2024"]],"literal":"2024"},"event-place":"","id":"993ffe08eb3813d0a25b30b88a2d8b0fdiglezakis","interhash":"d2f87ced0951cd393afba2fc4f3b7bb9","intrahash":"993ffe08eb3813d0a25b30b88a2d8b0f","issue":"","issued":{"date-parts":[["2024"]],"literal":"2024"},"keyword":"metadata ontologie artificialIntelligence llm","misc":{"eprint":"2405.11706","archiveprefix":"arXiv","primaryclass":"cs.AI"},"note":"","number":"","page":"","page-first":"","publisher":"","publisher-place":"","status":"","title":"Increasing the LLM Accuracy for Question Answering: Ontologies to the Rescue!","type":"article","username":"diglezakis","version":"","volume":""},"d2260d8bcf30d2358a8f5113c43706c0diglezakis":{"DOI":"","ISBN":"","ISSN":"","URL":"","abstract":"","annote":"","author":[{"family":"Gundersen","given":"Odd 
Erik"},{"family":"Kjensmo","given":"Sigbjørn"}],"citation-label":"gundersen2018state","collection-editor":[{"family":"McIlraith","given":"Sheila"},{"family":"Weinberger","given":"Kilian"}],"collection-title":"","container-author":[{"family":"McIlraith","given":"Sheila"},{"family":"Weinberger","given":"Kilian"}],"container-title":"Proceedings of the 32nd AAAI Conference on Artificial Intelligence (AAAI-18)","documents":[],"edition":"","editor":[{"family":"McIlraith","given":"Sheila"},{"family":"Weinberger","given":"Kilian"}],"event-date":{"date-parts":[["2018"]],"literal":"2018"},"event-place":"","id":"d2260d8bcf30d2358a8f5113c43706c0diglezakis","interhash":"d751c2dec9822c6feb4557861102c792","intrahash":"d2260d8bcf30d2358a8f5113c43706c0","issue":"","issued":{"date-parts":[["2018"]],"literal":"2018"},"keyword":"forschungsdaten software reproducibility artificialIntelligence","misc":{"language":"en","eventtitle":"The Thirty-Second AAAI Conference on Artificial Intelligence (AAAI-18)","eventdate":"February 2–7, 2018","venue":"New Orleans, Louisiana, USA"},"note":"","number":"","page":"","page-first":"","publisher":"Association for the Advancement of Artificial Intelligence","publisher-place":"","status":"","title":"State of the Art: Reproducibility in Artificial Intelligence","type":"paper-conference","username":"diglezakis","version":"","volume":""}}