{"1379876c8e44201273f877236280c71exsample":{"DOI":"10.14618/ids-pub-10470","ISBN":"","ISSN":"","URL":"https://nbn-resolving.org/urn:nbn:de:bsz:mh39-104700","abstract":"Making research data publicly available for evaluation or reuse is a fundamental part of good scientific practice. However, regulations such as copyright law can prevent this practice and thereby hamper scientific progress. In Germany, text-based research disciplines have for a long time been mostly unable to publish corpora made from material outside of the public domain, effectively excluding contemporary works. While there are approaches to obfuscate text material in a way that it is no longer covered by the original copyright, many use cases still require the raw textual context for evaluation or follow-up research. Recent changes in copyright now permit text and data mining on copyrighted works. However, questions regarding reusability and sharing of such corpora at a later time are still not answered to a satisfying degree. We propose a workflow that allows interested third parties to access customized excerpts of protected corpora in accordance with current German copyright law and the soon to be implemented guidelines of the Digital Single Market directive. Our prototype is a very lightweight web interface that builds on commonly used repository software and web standards.","annote":"","author":[{"family":"Gärtner","given":"Markus"},{"family":"Kleinkopf","given":"Felicitas"},{"family":"Andresen","given":"Melanie"},{"family":"Hermann","given":"Sibylle"}],"citation-label":"Gaertne/etal:2021","collection-editor":[{"family":"Lüngen","given":"Harald"},{"family":"Kupietz","given":"Marc"},{"family":"Bański","given":"Piotr"},{"family":"Barbaresi","given":"Adrien"},{"family":"Clematide","given":"Simon"},{"family":"Pisetta","given":"Ines"}],"collection-title":"Proceedings of the Workshop on Challenges in the Management of Large Corpora (CMLC-9) 2021. Limerick, 12 July 2021 (Online-Event)","container-author":[{"family":"Lüngen","given":"Harald"},{"family":"Kupietz","given":"Marc"},{"family":"Bański","given":"Piotr"},{"family":"Barbaresi","given":"Adrien"},{"family":"Clematide","given":"Simon"},{"family":"Pisetta","given":"Ines"}],"container-title":"","documents":[],"edition":"","editor":[{"family":"Lüngen","given":"Harald"},{"family":"Kupietz","given":"Marc"},{"family":"Bański","given":"Piotr"},{"family":"Barbaresi","given":"Adrien"},{"family":"Clematide","given":"Simon"},{"family":"Pisetta","given":"Ines"}],"event-date":{"date-parts":[["2021"]],"literal":"2021"},"event-place":"Mannheim","id":"1379876c8e44201273f877236280c71exsample","interhash":"561f3d778c6cccefca678fedc2d802b6","intrahash":"1379876c8e44201273f877236280c71e","issue":"","issued":{"date-parts":[["2021"]],"literal":"2021"},"keyword":"myown from:hermann publist xsample lebenslauf ubprojekt","misc":{"language":"en","doi":"10.14618/ids-pub-10470"},"note":"","number":"","number-of-pages":"9","page":"10-19","page-first":"10","publisher":"Leibniz-Institut für Deutsche Sprache","publisher-place":"Mannheim","status":"","title":"Corpus reusability and copyright - challenges and opportunities","type":"paper-conference","username":"xsample","version":"","volume":""},"3b3ab5667472e629b51248c36c6bc1d6xsample":{"DOI":"","ISBN":"","ISSN":"","URL":"https://nbn-resolving.org/urn:nbn:de:0290-opus4-176043","abstract":"","annote":"","author":[{"family":"Hermann","given":"Sibylle"},{"family":"Gärtner","given":"Markus"},{"family":"Kleinkopf","given":"Felicitas"}],"citation-label":"hermann2021nutzlich","collection-editor":[],"collection-title":"","container-author":[],"container-title":"Themenkreis 6: Forschungsdaten und forschungsnahe Dienstleistungen / Forschungsdaten: Potentiale und Chancen(16.06.2021, 15:00 - 16:00 Uhr, Raum 2 (virtuell))","documents":[],"edition":"","editor":[],"event-date":{"date-parts":[["2021"]],"literal":"2021"},"event-place":"","id":"3b3ab5667472e629b51248c36c6bc1d6xsample","interhash":"21de706376f6e313e0dd477c458fc6a2","intrahash":"3b3ab5667472e629b51248c36c6bc1d6","issue":"","issued":{"date-parts":[["2021"]],"literal":"2021"},"keyword":"myown presentlist from:hermann xsample ubvortrag","note":"","number":"","page":"","page-first":"","publisher":"","publisher-place":"","status":"","title":"Von nützlich zu nutzbar - Zugang zu geschützten Forschungsdaten ermöglichen","type":"speech","username":"xsample","version":"","volume":""},"7c3f535bf2385881cbb0b7b0366dfb56xsample":{"DOI":"https://doi.org/10.5446/49264","ISBN":"","ISSN":"","URL":"","abstract":"","annote":"","author":[{"family":"Hermann","given":"Sibylle"},{"family":"Kleinkopf","given":"Felicitas"},{"family":"Gärtner","given":"Markus"}],"citation-label":"hermann2020xsample","collection-editor":[],"collection-title":"","container-author":[],"container-title":"","documents":[],"edition":"","editor":[],"event-date":{"date-parts":[["2020"]],"literal":"2020"},"event-place":"","id":"7c3f535bf2385881cbb0b7b0366dfb56xsample","interhash":"3319907d28400fc148a7bee3a352953c","intrahash":"7c3f535bf2385881cbb0b7b0366dfb56","issue":"","issued":{"date-parts":[["2020"]],"literal":"2020"},"keyword":"myown presentlist from:hermann ubvortrag","misc":{"eventtitle":"Open-Access-Tage 2020","doi":"https://doi.org/10.5446/49264"},"note":"","number":"","page":"","page-first":"","publisher":"","publisher-place":"","status":"","title":"Xsample: Text und Data Mining auf geschützten Werken durch Auszüge transparent erschließen","type":"speech","username":"xsample","version":"","volume":""},"4e85b8f46a5e0d5d770f71d2b7d7c6cfxsample":{"DOI":"10.18419/opus-11445","ISBN":"","ISSN":"","URL":"","abstract":"","annote":"","author":[{"family":"Kleinkopf","given":"Felicitas"},{"family":"Jacke","given":"Janina"},{"family":"Gärtner","given":"Markus"}],"citation-label":"kleinkopf2021urheberrechtliche","collection-editor":[],"collection-title":"","container-author":[],"container-title":"Erstpublikation: MMMR Zeitschrift für IT-Recht und Recht der Digitalisierung","documents":[],"edition":"","editor":[],"event-date":{"date-parts":[["2021"]],"literal":"2021"},"event-place":"","id":"4e85b8f46a5e0d5d770f71d2b7d7c6cfxsample","interhash":"199757b961b58b0879cfefc7310adb41","intrahash":"4e85b8f46a5e0d5d770f71d2b7d7c6cf","issue":"","issued":{"date-parts":[["2021"]],"literal":"2021"},"keyword":"from:hermann pub","misc":{"doi":"10.18419/opus-11445"},"note":"","number":"","page":"196 ff.","page-first":"196","publisher":"","publisher-place":"","status":"","title":"Text- und Data-Mining Urheberrechtliche Grenzen der Nachnutzung wissenschaftlicher Korpora bei computergestützten Verfahren und digitalen Ressourcen","type":"article-journal","username":"xsample","version":"","volume":"3"},"0f1ffc6145376841942eac695cb864c3xsample":{"DOI":"10.14618/IDS-PUB-10467","ISBN":"","ISSN":"","URL":"https://ids-pub.bsz-bw.de/10467","abstract":"","annote":"","author":[{"family":"Gärtner","given":"Markus"},{"family":"Kleinkopf","given":"Felicitas"},{"family":"Andresen","given":"Melanie"},{"family":"Hermann","given":"Sybille"}],"citation-label":"grtner2021corpus","collection-editor":[{"family":"Lüngen","given":"Harald"},{"family":"Kupietz","given":"Marc"},{"family":"Bański","given":"Piotr"},{"family":"Barbaresi","given":"Adrien"},{"family":"Clematide","given":"Simon"},{"family":"Pisetta","given":"Ines"}],"collection-title":"","container-author":[{"family":"Lüngen","given":"Harald"},{"family":"Kupietz","given":"Marc"},{"family":"Bański","given":"Piotr"},{"family":"Barbaresi","given":"Adrien"},{"family":"Clematide","given":"Simon"},{"family":"Pisetta","given":"Ines"}],"container-title":"Proceedings of the Workshop on Challenges in the Management of Large Corpora (CMLC-9) 2021. Limerick, 12 July 2021 (Online-Event)","documents":[],"edition":"","editor":[{"family":"Lüngen","given":"Harald"},{"family":"Kupietz","given":"Marc"},{"family":"Bański","given":"Piotr"},{"family":"Barbaresi","given":"Adrien"},{"family":"Clematide","given":"Simon"},{"family":"Pisetta","given":"Ines"}],"event-date":{"date-parts":[["2021"]],"literal":"2021"},"event-place":"","id":"0f1ffc6145376841942eac695cb864c3xsample","interhash":"561f3d778c6cccefca678fedc2d802b6","intrahash":"0f1ffc6145376841942eac695cb864c3","issue":"","issued":{"date-parts":[["2021"]],"literal":"2021"},"keyword":"from:hermann pub","misc":{"copyright":"Creative Commons - CC BY - Namensnennung 4.0 International","language":"en","doi":"10.14618/IDS-PUB-10467"},"note":"","number":"","page":"","page-first":"","publisher":"Leibniz-Institut für Deutsche Sprache","publisher-place":"","status":"","title":"Corpus Reusability and Copyright – Challenges and Opportunities","type":"paper-conference","username":"xsample","version":"","volume":""}}