{ "access": { "embargo": { "active": false, "reason": null }, "files": "public", "record": "public", "status": "open" }, "created": "2021-10-05T15:54:40.648553+00:00", "custom_fields": { "meeting:meeting": { "acronym": "ICCV", "dates": "11-17 October 2021", "place": "Virtual", "title": "International Conference on Computer Vision", "url": "https://iccv2021.thecvf.com/" } }, "deletion_status": { "is_deleted": false, "status": "P" }, "files": { "count": 1, "enabled": true, "entries": { "08992.pdf": { "checksum": "md5:1be1739a32b6463d6f383bba4609ccf1", "ext": "pdf", "id": "fe3dc4b0-382d-4d1a-a512-faccb9d53059", "key": "08992.pdf", "metadata": null, "mimetype": "application/pdf", "size": 4834776 } }, "order": [], "total_bytes": 4834776 }, "id": "5550474", "is_draft": false, "is_published": true, "links": { "access": "https://zenodo.org/api/records/5550474/access", "access_links": "https://zenodo.org/api/records/5550474/access/links", "access_request": "https://zenodo.org/api/records/5550474/access/request", "access_users": "https://zenodo.org/api/records/5550474/access/users", "archive": "https://zenodo.org/api/records/5550474/files-archive", "archive_media": "https://zenodo.org/api/records/5550474/media-files-archive", "communities": "https://zenodo.org/api/records/5550474/communities", "communities-suggestions": "https://zenodo.org/api/records/5550474/communities-suggestions", "doi": "https://doi.org/10.5281/zenodo.5550474", "draft": "https://zenodo.org/api/records/5550474/draft", "files": "https://zenodo.org/api/records/5550474/files", "latest": "https://zenodo.org/api/records/5550474/versions/latest", "latest_html": "https://zenodo.org/records/5550474/latest", "media_files": "https://zenodo.org/api/records/5550474/media-files", "parent": "https://zenodo.org/api/records/5550473", "parent_doi": "https://zenodo.org/doi/10.5281/zenodo.5550473", "parent_html": "https://zenodo.org/records/5550473", "requests": "https://zenodo.org/api/records/5550474/requests", 
"reserve_doi": "https://zenodo.org/api/records/5550474/draft/pids/doi", "self": "https://zenodo.org/api/records/5550474", "self_doi": "https://zenodo.org/doi/10.5281/zenodo.5550474", "self_html": "https://zenodo.org/records/5550474", "self_iiif_manifest": "https://zenodo.org/api/iiif/record:5550474/manifest", "self_iiif_sequence": "https://zenodo.org/api/iiif/record:5550474/sequence/default", "versions": "https://zenodo.org/api/records/5550474/versions" }, "media_files": { "count": 0, "enabled": false, "entries": {}, "order": [], "total_bytes": 0 }, "metadata": { "creators": [ { "affiliations": [ { "name": "Queen Mary University of London" } ], "person_or_org": { "family_name": "Christos Tzelepis", "name": "Christos Tzelepis", "type": "personal" } }, { "affiliations": [ { "name": "Queen Mary University of London" } ], "person_or_org": { "family_name": "Georgios Tzimiropoulos", "name": "Georgios Tzimiropoulos", "type": "personal" } }, { "affiliations": [ { "name": "Queen Mary University of London" } ], "person_or_org": { "family_name": "Ioannis Patras", "name": "Ioannis Patras", "type": "personal" } } ], "description": "
This work addresses the problem of discovering, in an unsupervised manner, interpretable paths in the latent space of pretrained GANs, so as to provide an intuitive and easy way of controlling the underlying generative factors. In doing so, it addresses some of the limitations of the state-of-the-art works, namely, a) that they discover directions that are independent of the latent code, i.e., paths that are linear, and b) that their evaluation relies either on visual inspection or on laborious human labeling. More specifically, we propose to learn non-linear warpings on the latent space, each one parametrized by a set of RBF-based latent space warping functions, and where each warping gives rise to a family of non-linear paths via the gradient of the function. Building on the work of Voynov and Babenko, which discovers linear paths, we optimize the trainable parameters of the set of RBFs, so that images that are generated by codes along different paths are easily distinguishable by a discriminator network. This leads to easily distinguishable image transformations, such as pose and facial expressions in facial images. We show that linear paths can be derived as a special case of our method, and show experimentally that non-linear paths in the latent space lead to steeper, more disentangled and interpretable changes in the image space than in state-of-the-art methods, both qualitatively and quantitatively. We make the code and the pretrained models publicly available at: https://github.com/chi0tzp/WarpedGANSpace.
", "funding": [ { "award": { "acronym": "AI4Media", "id": "00k4n6c32::951911", "identifiers": [ { "identifier": "https://cordis.europa.eu/projects/951911", "scheme": "url" } ], "number": "951911", "program": "H2020", "title": { "en": "A European Excellence Centre for Media, Society and Democracy" } }, "funder": { "id": "00k4n6c32", "name": "European Commission" } } ], "publication_date": "2021-10-05", "publisher": "Zenodo", "resource_type": { "id": "publication-conferencepaper", "title": { "de": "Konferenzbeitrag", "en": "Conference paper" } }, "rights": [ { "description": { "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited." }, "icon": "cc-by-icon", "id": "cc-by-4.0", "props": { "scheme": "spdx", "url": "https://creativecommons.org/licenses/by/4.0/legalcode" }, "title": { "en": "Creative Commons Attribution 4.0 International" } } ], "title": "WarpedGANSpace: Finding non-linear RBF paths in GAN latent space" }, "parent": { "access": { "owned_by": { "user": 257675 } }, "communities": { "default": "8538384b-cd84-4cc6-a77c-c259e9568dfd", "entries": [ { "access": { "member_policy": "open", "members_visibility": "public", "record_policy": "open", "review_policy": "open", "visibility": "public" }, "children": { "allow": false }, "created": "2020-10-22T12:35:38.515614+00:00", "custom_fields": {}, "deletion_status": { "is_deleted": false, "status": "P" }, "id": "8538384b-cd84-4cc6-a77c-c259e9568dfd", "links": {}, "metadata": { "curation_policy": "This community will accept all uploads that have been generated by partners of the AI4Media consortium that received funding from the project.
\r\n", "description": "Horizon H2020 EC-funded project AI4Media: A European Excellence Centre for Media, Society and Democracy", "page": "Motivated by the challenges, risks and opportunities that the widespread use of artificial intelligence (AI) has brought to the media, society and politics, the EU-funded AI4Media project aspires to establish a centre of excellence and a wide network of researchers across Europe and beyond. Its focus will be on delivering the next generation of core AI advances to serve the key sector of media, making sure that European values surrounding ethical and trustworthy AI are embedded in future AI deployments. The project will be supplemented by a funding framework, a PhD programme and a set of use cases to demonstrate the impact of the actions taken on the media sector.
\r\n", "title": "AI4Media H2020 Project" }, "revision_id": 0, "slug": "ai4media", "updated": "2020-10-22T12:35:38.584014+00:00" } ], "ids": [ "8538384b-cd84-4cc6-a77c-c259e9568dfd" ] }, "id": "5550473", "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.5550473", "provider": "datacite" } } }, "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.5550474", "provider": "datacite" }, "oai": { "identifier": "oai:zenodo.org:5550474", "provider": "oai" } }, "revision_id": 4, "stats": { "all_versions": { "data_volume": 410955960.0, "downloads": 85, "unique_downloads": 82, "unique_views": 132, "views": 141 }, "this_version": { "data_volume": 410955960.0, "downloads": 85, "unique_downloads": 82, "unique_views": 132, "views": 141 } }, "status": "published", "updated": "2021-10-06T01:48:31.542502+00:00", "versions": { "index": 1, "is_latest": true } }