{ "access": { "embargo": { "active": false, "reason": null }, "files": "public", "record": "public", "status": "open" }, "created": "2018-04-01T17:41:03.415830+00:00", "custom_fields": { "meeting:meeting": { "acronym": "BTW", "dates": "11-15 March 2013", "place": "Magdeburg, Germany", "title": "Datenbanksysteme f\u00fcr Business, Technologie und Web", "url": "http://www.btw-2013.de/proceedings/Applying%20Stratosphere%20for%20Big%20Data%20Analytics.pdf" } }, "deletion_status": { "is_deleted": false, "status": "P" }, "files": { "count": 2, "enabled": true, "entries": { "2013-btw.pdf": { "checksum": "md5:47965773d1d2e345bbef7caa22714e70", "ext": "pdf", "id": "01cbc460-0ac0-4dd2-8a56-b6dd49753867", "key": "2013-btw.pdf", "metadata": null, "mimetype": "application/pdf", "size": 970718 }, "bib.bib": { "checksum": "md5:7133a14d23b07c2c494bce90929eb4ec", "ext": "bib", "id": "537f2446-a96b-44e4-a370-81e7e12be520", "key": "bib.bib", "metadata": null, "mimetype": "application/octet-stream", "size": 1209 } }, "order": [], "total_bytes": 971927 }, "id": "1210857", "is_draft": false, "is_published": true, "links": { "access": "https://zenodo.org/api/records/1210857/access", "access_links": "https://zenodo.org/api/records/1210857/access/links", "access_request": "https://zenodo.org/api/records/1210857/access/request", "access_users": "https://zenodo.org/api/records/1210857/access/users", "archive": "https://zenodo.org/api/records/1210857/files-archive", "archive_media": "https://zenodo.org/api/records/1210857/media-files-archive", "communities": "https://zenodo.org/api/records/1210857/communities", "communities-suggestions": "https://zenodo.org/api/records/1210857/communities-suggestions", "doi": "https://doi.org/10.5281/zenodo.1210857", "draft": "https://zenodo.org/api/records/1210857/draft", "files": "https://zenodo.org/api/records/1210857/files", "latest": "https://zenodo.org/api/records/1210857/versions/latest", "latest_html": "https://zenodo.org/records/1210857/latest", "media_files": "https://zenodo.org/api/records/1210857/media-files", "parent": "https://zenodo.org/api/records/1210856", "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.1210856", "parent_html": "https://zenodo.org/records/1210856", "requests": "https://zenodo.org/api/records/1210857/requests", "reserve_doi": "https://zenodo.org/api/records/1210857/draft/pids/doi", "self": "https://zenodo.org/api/records/1210857", "self_doi": "https://zenodo.org/doi/10.5281/zenodo.1210857", "self_html": "https://zenodo.org/records/1210857", "self_iiif_manifest": "https://zenodo.org/api/iiif/record:1210857/manifest", "self_iiif_sequence": "https://zenodo.org/api/iiif/record:1210857/sequence/default", "versions": "https://zenodo.org/api/records/1210857/versions" }, "media_files": { "count": 0, "enabled": false, "entries": {}, "order": [], "total_bytes": 0 }, "metadata": { "creators": [ { "affiliations": [ { "name": "Leich" } ], "person_or_org": { "family_name": "Marcus", "name": "Marcus", "type": "personal" } }, { "affiliations": [ { "name": "Adamek" } ], "person_or_org": { "family_name": "Jochen", "name": "Jochen", "type": "personal" } }, { "affiliations": [ { "name": "Schubotz" } ], "person_or_org": { "family_name": "Moritz", "identifiers": [ { "identifier": "0000-0001-7141-4997", "scheme": "orcid" } ], "name": "Moritz", "type": "personal" } }, { "affiliations": [ { "name": "Rheinl\u00e4nder" } ], "person_or_org": { "family_name": "Astrid", "name": "Astrid", "type": "personal" } }, { "affiliations": [ { "name": "Markl" } ], "person_or_org": { "family_name": "Volker", "name": "Volker", "type": "personal" } } ], "description": "
Analyzing big data sets as they occur in modern business and science applications requires query languages that allow for the specification of complex data processing tasks. Moreover, these ideally declarative query specifications have to be optimized, parallelized and scheduled for processing on massively parallel data processing platforms. This paper demonstrates the application of Stratosphere to different kinds of Big Data Analytics tasks. Using examples from different application domains, we show how to formulate analytical tasks as Meteor queries and execute them with Stratosphere. These examples include data cleansing and information extraction tasks, and a correlation analysis of microblogging and stock trade volume data that we describe in detail in this paper.
", "languages": [ { "id": "eng", "title": { "en": "English" } } ], "publication_date": "2013-03-11", "publisher": "Zenodo", "related_identifiers": [ { "identifier": "http://cs.emis.de/LNI/Proceedings/Proceedings214/507.pdf", "relation_type": { "id": "isidenticalto", "title": { "de": "Ist identisch mit", "en": "Is identical to" } }, "resource_type": { "id": "publication-conferencepaper", "title": { "de": "Konferenzbeitrag", "en": "Conference paper" } }, "scheme": "url" } ], "resource_type": { "id": "publication-conferencepaper", "title": { "de": "Konferenzbeitrag", "en": "Conference paper" } }, "rights": [ { "description": { "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited." }, "icon": "cc-by-icon", "id": "cc-by-4.0", "props": { "scheme": "spdx", "url": "https://creativecommons.org/licenses/by/4.0/legalcode" }, "title": { "en": "Creative Commons Attribution 4.0 International" } } ], "title": "Applying Stratosphere for Big Data Analytics" }, "parent": { "access": { "owned_by": { "user": 40009 } }, "communities": {}, "id": "1210856", "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.1210856", "provider": "datacite" } } }, "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.1210857", "provider": "datacite" }, "oai": { "identifier": "oai:zenodo.org:1210857", "provider": "oai" } }, "revision_id": 7, "stats": { "all_versions": { "data_volume": 25242295.0, "downloads": 29, "unique_downloads": 28, "unique_views": 47, "views": 64 }, "this_version": { "data_volume": 25242295.0, "downloads": 29, "unique_downloads": 28, "unique_views": 47, "views": 64 } }, "status": "published", "updated": "2020-02-28T14:33:56.421633+00:00", "versions": { "index": 1, "is_latest": true } }