{ "access": { "embargo": { "active": false, "reason": null }, "files": "public", "record": "public", "status": "open" }, "created": "2021-12-09T09:08:29.255876+00:00", "custom_fields": { "meeting:meeting": { "dates": "06\u201309 September 2021", "place": "D\u00fcsseldorf, Germany", "session": "Shared Task on the Disambiguation of German Verbal Idioms", "title": "KONVENS 2021", "url": "https://konvens2021.phil.hhu.de" } }, "deletion_status": { "is_deleted": false, "status": "P" }, "files": { "count": 1, "enabled": true, "entries": { "KONVENS_2021_Disambiguation_ST-Shallow_Context_Analysis_for_German_Idiom_Detection.pdf": { "checksum": "md5:acc5ec501bcf9ccc8ba2dd6669c95c0d", "ext": "pdf", "id": "db4bc17b-8479-4c08-88f4-78f5f9fb26bf", "key": "KONVENS_2021_Disambiguation_ST-Shallow_Context_Analysis_for_German_Idiom_Detection.pdf", "metadata": null, "mimetype": "application/pdf", "size": 120284 } }, "order": [], "total_bytes": 120284 }, "id": "5769519", "is_draft": false, "is_published": true, "links": { "access": "https://zenodo.org/api/records/5769519/access", "access_links": "https://zenodo.org/api/records/5769519/access/links", "access_request": "https://zenodo.org/api/records/5769519/access/request", "access_users": "https://zenodo.org/api/records/5769519/access/users", "archive": "https://zenodo.org/api/records/5769519/files-archive", "archive_media": "https://zenodo.org/api/records/5769519/media-files-archive", "communities": "https://zenodo.org/api/records/5769519/communities", "communities-suggestions": "https://zenodo.org/api/records/5769519/communities-suggestions", "doi": "https://doi.org/10.5281/zenodo.5769519", "draft": "https://zenodo.org/api/records/5769519/draft", "files": "https://zenodo.org/api/records/5769519/files", "latest": "https://zenodo.org/api/records/5769519/versions/latest", "latest_html": "https://zenodo.org/records/5769519/latest", "media_files": "https://zenodo.org/api/records/5769519/media-files", "parent": "https://zenodo.org/api/records/5769518", "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.5769518", "parent_html": "https://zenodo.org/records/5769518", "requests": "https://zenodo.org/api/records/5769519/requests", "reserve_doi": "https://zenodo.org/api/records/5769519/draft/pids/doi", "self": "https://zenodo.org/api/records/5769519", "self_doi": "https://zenodo.org/doi/10.5281/zenodo.5769519", "self_html": "https://zenodo.org/records/5769519", "self_iiif_manifest": "https://zenodo.org/api/iiif/record:5769519/manifest", "self_iiif_sequence": "https://zenodo.org/api/iiif/record:5769519/sequence/default", "versions": "https://zenodo.org/api/records/5769519/versions" }, "media_files": { "count": 0, "enabled": false, "entries": {}, "order": [], "total_bytes": 0 }, "metadata": { "creators": [ { "affiliations": [ { "name": "Leipzig University" } ], "person_or_org": { "family_name": "Amin", "given_name": "Miriam", "name": "Amin, Miriam", "type": "personal" } }, { "affiliations": [ { "name": "Leibniz Institute for the German Language" } ], "person_or_org": { "family_name": "Fankhauser", "given_name": "Peter", "name": "Fankhauser, Peter", "type": "personal" } }, { "affiliations": [ { "name": "Leibniz Institute for the German Language" } ], "person_or_org": { "family_name": "Kupietz", "given_name": "Marc", "name": "Kupietz, Marc", "type": "personal" } }, { "affiliations": [ { "name": "Leibniz Institute for the German Language" } ], "person_or_org": { "family_name": "Schneider", "given_name": "Roman", "name": "Schneider, Roman", "type": "personal" } } ], "description": "
In order to differentiate between figurative and literal usage of verb-noun combinations for the shared task on the disambiguation of German Verbal Idioms issued for KONVENS 2021, we apply and extend an approach originally developed for detecting idioms in a dataset consisting of random ngram samples. The classification is done by implementing a rather shallow, statistics-based pipeline without intensive preprocessing and examinations on the morphosyntactic and semantic level. We describe the overall approach, the differences between the original dataset and the dataset of the KONVENS task, provide experimental classification results, and analyse the individual contributions of our feature sets.
", "publication_date": "2021-09-06", "publisher": "Zenodo", "related_identifiers": [ { "identifier": "https://konvens.org/proceedings/2021/papers/KONVENS_2021_Disambiguation_ST-Shallow_Context_Analysis_for_German_Idiom_Detection.pdf", "relation_type": { "id": "isidenticalto", "title": { "de": "Ist identisch mit", "en": "Is identical to" } }, "resource_type": { "id": "publication-conferencepaper", "title": { "de": "Konferenzbeitrag", "en": "Conference paper" } }, "scheme": "url" } ], "resource_type": { "id": "publication-conferencepaper", "title": { "de": "Konferenzbeitrag", "en": "Conference paper" } }, "rights": [ { "description": { "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited." }, "icon": "cc-by-icon", "id": "cc-by-4.0", "props": { "scheme": "spdx", "url": "https://creativecommons.org/licenses/by/4.0/legalcode" }, "title": { "en": "Creative Commons Attribution 4.0 International" } } ], "subjects": [ { "subject": "Natural Language Processing" }, { "subject": "Shared Task" }, { "subject": "Multiword Expressions" } ], "title": "Shallow Context Analysis for German Idiom Detection" }, "parent": { "access": { "owned_by": { "user": 266290 } }, "communities": {}, "id": "5769518", "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.5769518", "provider": "datacite" } } }, "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.5769519", "provider": "datacite" }, "oai": { "identifier": "oai:zenodo.org:5769519", "provider": "oai" } }, "revision_id": 4, "stats": { "all_versions": { "data_volume": 9261868.0, "downloads": 77, "unique_downloads": 61, "unique_views": 107, "views": 132 }, "this_version": { "data_volume": 9261868.0, "downloads": 77, "unique_downloads": 61, "unique_views": 105, "views": 130 } }, "status": "published", "updated": "2021-12-09T13:48:50.553970+00:00", "versions": { "index": 1, "is_latest": true } }