Conference paper Open Access

Flow R-CNN: Flow-Enhanced Object Detection

Psaltis, Athanasios; Dimou, Anastasios; Alvarez, Federico; Daras, Petros


DataCite XML Export

<?xml version='1.0' encoding='utf-8'?>
<!--
  DataCite (kernel-4) metadata record for the Zenodo deposit of the
  conference paper "Flow R-CNN: Flow-Enhanced Object Detection".

  The schema hint below points at the kernel-4.4 XSD because this record
  uses resourceTypeGeneral="ConferencePaper", a value that is not part of
  the kernel-4.1 controlled list; with a 4.1 hint the record does not
  validate against the schema it declares.
-->
<resource xmlns="http://datacite.org/schema/kernel-4"
          xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xsi:schemaLocation="http://datacite.org/schema/kernel-4 http://schema.datacite.org/meta/kernel-4.4/metadata.xsd">
  <!-- Primary identifier: the record landing page (a URL; no DOI is given here). -->
  <identifier identifierType="URL">https://zenodo.org/record/4603216</identifier>
  <!-- Authors in publication order; element order is significant. -->
  <creators>
    <creator>
      <creatorName>Psaltis, Athanasios</creatorName>
      <givenName>Athanasios</givenName>
      <familyName>Psaltis</familyName>
      <affiliation>CERTH</affiliation>
    </creator>
    <creator>
      <creatorName>Dimou, Anastasios</creatorName>
      <givenName>Anastasios</givenName>
      <familyName>Dimou</familyName>
      <affiliation>CERTH</affiliation>
    </creator>
    <!-- NOTE(review): no affiliation is recorded for this creator; confirm with the depositor before adding one. -->
    <creator>
      <creatorName>Alvarez, Federico</creatorName>
      <givenName>Federico</givenName>
      <familyName>Alvarez</familyName>
    </creator>
    <creator>
      <creatorName>Daras, Petros</creatorName>
      <givenName>Petros</givenName>
      <familyName>Daras</familyName>
      <affiliation>CERTH</affiliation>
    </creator>
  </creators>
  <titles>
    <title>Flow R-CNN: Flow-Enhanced Object Detection</title>
  </titles>
  <publisher>Zenodo</publisher>
  <publicationYear>2021</publicationYear>
  <dates>
    <date dateType="Issued">2021-02-21</date>
  </dates>
  <resourceType resourceTypeGeneral="ConferencePaper"/>
  <!-- Repeats the landing-page URL given in <identifier> as an alternate identifier. -->
  <alternateIdentifiers>
    <alternateIdentifier alternateIdentifierType="url">https://zenodo.org/record/4603216</alternateIdentifier>
  </alternateIdentifiers>
  <!-- Links out of the record: the DOI it is declared identical to, and the community it is part of. -->
  <relatedIdentifiers>
    <relatedIdentifier relatedIdentifierType="DOI" relationType="IsIdenticalTo">10.1007/978-3-030-68763-2_52</relatedIdentifier>
    <relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://zenodo.org/communities/787061</relatedIdentifier>
  </relatedIdentifiers>
  <!-- Two rights statements: the licence itself and the access level. -->
  <rightsList>
    <rights rightsURI="https://creativecommons.org/licenses/by/4.0/legalcode">Creative Commons Attribution 4.0 International</rights>
    <rights rightsURI="info:eu-repo/semantics/openAccess">Open Access</rights>
  </rightsList>
  <!--
    The abstract carries entity-escaped HTML paragraph markup as plain text.
    It is kept on a single line on purpose: any line break or indentation
    added inside the element would become part of the abstract.
  -->
  <descriptions>
    <description descriptionType="Abstract">&lt;p&gt;This work addresses the problem of multi-task object detection in an efficient, generic but at the same time simple way, following the recent and highly promising studies in the computer vision field, and more specifically the Region-based Convolutional Neural Network (R-CNN) approach. A flow-enhanced methodology for object detection is proposed, by adding a new branch to predict an object-level flow field. Following a scheme grounded on neuroscience, a pseudo-temporal motion stream is integrated in parallel to the classification, bounding box regression and segmentation mask prediction branches of Mask R-CNN. Extensive experiments and thorough comparative evaluation provide a detailed analysis of the problem at hand and demonstrate the added value of the involved object-level flow branch. The overall proposed approach achieves improved performance in the six currently broadest and most challenging publicly available semantic urban scene understanding datasets, surpassing the region-based baseline method.&lt;/p&gt;</description>
  </descriptions>
  <!-- Funding: funder, its Crossref Funder ID, and the grant (number, URI and title). -->
  <fundingReferences>
    <fundingReference>
      <funderName>European Commission</funderName>
      <funderIdentifier funderIdentifierType="Crossref Funder ID">10.13039/501100000780</funderIdentifier>
      <awardNumber awardURI="info:eu-repo/grantAgreement/EC/H2020/787061/">787061</awardNumber>
      <awardTitle>Advanced tools for fighting oNline Illegal TrAfficking</awardTitle>
    </fundingReference>
  </fundingReferences>
</resource>
22 views
18 downloads
Views 22
Downloads 18
Data volume 57.0 MB
Unique views 20
Unique downloads 16

Share

Cite as