{ "access": { "embargo": { "active": false, "reason": null }, "files": "public", "record": "public", "status": "open" }, "created": "2019-10-15T10:50:38.493145+00:00", "custom_fields": { "legacy:subjects": [ { "identifier": "https://dewey.info/", "scheme": "url", "term": "004 Data processing & computer science" }, { "identifier": "https://dewey.info/", "scheme": "url", "term": "020 Library & information sciences" } ] }, "deletion_status": { "is_deleted": false, "status": "P" }, "files": { "count": 1, "enabled": true, "entries": { "paper_data.tar.gz": { "checksum": "md5:e93b229739ae7f646dbeed16233cdc9b", "ext": "gz", "id": "e8f6464a-0024-40d4-a975-565076b4b58b", "key": "paper_data.tar.gz", "metadata": null, "mimetype": "application/gzip", "size": 91409 } }, "order": [], "total_bytes": 91409 }, "id": "3490468", "is_draft": false, "is_published": true, "links": { "access": "https://zenodo.org/api/records/3490468/access", "access_links": "https://zenodo.org/api/records/3490468/access/links", "access_request": "https://zenodo.org/api/records/3490468/access/request", "access_users": "https://zenodo.org/api/records/3490468/access/users", "archive": "https://zenodo.org/api/records/3490468/files-archive", "archive_media": "https://zenodo.org/api/records/3490468/media-files-archive", "communities": "https://zenodo.org/api/records/3490468/communities", "communities-suggestions": "https://zenodo.org/api/records/3490468/communities-suggestions", "doi": "https://doi.org/10.5281/zenodo.3490468", "draft": "https://zenodo.org/api/records/3490468/draft", "files": "https://zenodo.org/api/records/3490468/files", "latest": "https://zenodo.org/api/records/3490468/versions/latest", "latest_html": "https://zenodo.org/records/3490468/latest", "media_files": "https://zenodo.org/api/records/3490468/media-files", "parent": "https://zenodo.org/api/records/3490467", "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.3490467", "parent_html": "https://zenodo.org/records/3490467", "requests": "https://zenodo.org/api/records/3490468/requests", "reserve_doi": "https://zenodo.org/api/records/3490468/draft/pids/doi", "self": "https://zenodo.org/api/records/3490468", "self_doi": "https://zenodo.org/doi/10.5281/zenodo.3490468", "self_html": "https://zenodo.org/records/3490468", "self_iiif_manifest": "https://zenodo.org/api/iiif/record:3490468/manifest", "self_iiif_sequence": "https://zenodo.org/api/iiif/record:3490468/sequence/default", "versions": "https://zenodo.org/api/records/3490468/versions" }, "media_files": { "count": 0, "enabled": false, "entries": {}, "order": [], "total_bytes": 0 }, "metadata": { "creators": [ { "affiliations": [ { "name": "Leibniz Supercomputing Centre" } ], "person_or_org": { "family_name": "Tobias Weber", "identifiers": [ { "identifier": "0000-0003-1815-7041", "scheme": "orcid" } ], "name": "Tobias Weber", "type": "personal" } }, { "affiliations": [ { "name": "Database Systems Group, Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen" } ], "person_or_org": { "family_name": "Michael Fromm", "identifiers": [ { "identifier": "0000-0002-7244-4191", "scheme": "orcid" } ], "name": "Michael Fromm", "type": "personal" } }, { "affiliations": [ { "name": "Software Engineering Group, Kiel University" } ], "person_or_org": { "family_name": "Nelson Tavares de Sousa", "identifiers": [ { "identifier": "0000-0003-1866-7156", "scheme": "orcid" } ], "name": "Nelson Tavares de Sousa", "type": "personal" } } ], "description": "
Automated classification of metadata of research data by their discipline(s) of research can be used in scientometric research, by repository service providers, and in the context of research data aggregation services. Openly available metadata of the DataCite index for research data were used to compile a large training and evaluation set comprised of 609,524 records. This publication contains aggregated data for the paper. It also contains the evaluation data of all model/hyper-parameter training and test runs.
", "publication_date": "2019-10-15", "publisher": "Zenodo", "resource_type": { "id": "dataset", "title": { "de": "Datensatz", "en": "Dataset" } }, "rights": [ { "description": { "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited." }, "icon": "cc-by-icon", "id": "cc-by-4.0", "props": { "scheme": "spdx", "url": "https://creativecommons.org/licenses/by/4.0/legalcode" }, "title": { "en": "Creative Commons Attribution 4.0 International" } } ], "subjects": [ { "subject": "supervised machine learning" }, { "subject": "multi-label classification" }, { "subject": "research data" }, { "subject": "text processing" }, { "subject": "data science" }, { "subject": "disciplines of research" } ], "title": "Statistics and Evaluation Data for Publication \"Using Supervised Learning to Classify Metadata of Research Data by Discipline of Research\"" }, "parent": { "access": { "owned_by": { "user": 64749 } }, "communities": {}, "id": "3490467", "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.3490467", "provider": "datacite" } } }, "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.3490468", "provider": "datacite" }, "oai": { "identifier": "oai:zenodo.org:3490468", "provider": "oai" } }, "revision_id": 8, "stats": { "all_versions": { "data_volume": 797694949.0, "downloads": 8709, "unique_downloads": 8121, "unique_views": 4662, "views": 5978 }, "this_version": { "data_volume": 794069983.0, "downloads": 8687, "unique_downloads": 8099, "unique_views": 4266, "views": 5561 } }, "status": "published", "updated": "2020-05-24T11:34:02.128373+00:00", "versions": { "index": 1, "is_latest": false } }