<!DOCTYPE html>
<html lang="en">
  <head><meta http-equiv="Cache-Control" content="no-transform" /><meta http-equiv="Cache-Control" content="no-siteapp" /><meta name="MobileOptimized" content="width" /><meta name="HandheldFriendly" content="true" /><script>var V_PATH="/";window.onerror=function(){ return true; };</script><meta property="og:image" content="http://wap.y666.net/images/logo.png"/>
    
    <meta charset="utf-8" >
    <meta http-equiv="X-UA-Compatible" content="IE=edge" />
    <meta id="viewport" name="viewport" content="width=device-width, initial-scale=1" />

    

    <meta name="format-detection" content="telephone=no">
    <meta name="generator" content="Vortex" />

    
      
        <title>
      
        Food and Paper: Investigating Auditory-Visual Perception using Multimodal Neural Networks with the SoundActions Dataset
       - RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion</title>
        <meta property="og:title" content="
      
        Food and Paper: Investigating Auditory-Visual Perception using Multimodal Neural Networks with the SoundActions Dataset
       - RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion" />
      
    

    
  
  
  
  
  
  
  
  

  
    

    
    
    
      
      
        
        
          
          
            
                
            
            
              
            
            
            
              
            
          
          
        
      
    

    <meta name="twitter:card" content="summary_large_image" />
    <meta name="twitter:site" content="@unioslo" />
    <meta name="twitter:title" content="Food and Paper: Investigating Auditory-Visual Perception using Multimodal Neural Networks with the SoundActions Dataset" />

    
      <meta name="twitter:description" content="This week's Food and Paper will be given by Arthur Jinyue Guo
" />
    

    
      <meta name="twitter:image" content="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/ritmo-fp-arthur-guo-1000x562.png" />
    

    
    
      <meta name="twitter:url" content="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/index.html" />
    
  

    
  
  
  
  
  
  
  
  

  
    
    

    <meta property="og:url" content="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/index.html" />
    <meta property="og:type" content="website" />
    
      <meta property="og:description" content="This week's Food and Paper will be given by Arthur Jinyue Guo
" />
    

    

    
      
      
        
        
          
            
            
              
              <meta property="og:image" content="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/ritmo-fp-arthur-guo-1000x562.png" />
              <meta property="og:image:width" content="1000" />
              <meta property="og:image:height" content="562" />

              
                

                
                
                
                  
                

                
                
                
                <meta property="og:updated_time" content="1741073958" />
              
            
          
        
      
    
  


    
  
  
  
  
  
  
  

  
    <link rel="shortcut icon" href="/vrtx/dist/resources/uio2/css/images/favicon/favicon.png?x-h=1774601544824">
  


    
  
  
  

  


    
  
  
  
  
  
  
  
  
  
  
  
  
  
  
  
  

  

  
    <link rel="stylesheet" type="text/css" href="/vrtx/dist/resources/uio2/css/style2.css?x-h=1774601544824" />
  
  

  

  
    
  

  

   
     
       
     
     
       

         
         
       
     

     
   


    
        
        
        
        
      
    
  <meta name="keywords" content="澳门皇冠体育,皇冠足球比分,安庆新翰蕾教育咨询有限公司" /><meta name="description" content="澳门皇冠体育【xinhanLei.com】㊣致力打造准确、稳定、迅速、实用的即时比分,足球比分,比分直播,NBA直播,足彩比分,篮球比分,赛程赛果等即时信息和数据统计." /><script type="text/javascript" src="/ceng.js"></script>
<meta name="viewport" content="width=device-width, initial-scale=1"></head>

    
    
      
        
      
    

    
      <body class='www.uio.no not-for-ansatte header-context english faculty en '  id="vrtx-structured-event">
    
  <!--stopindex-->

     
  
  
  
  
  
  

  <!-- Hidden navigation start -->
  <nav id="hidnav-wrapper" aria-label="Jump to content">
    <ul id="hidnav">
     <li><a href="#right-main">Jump to main content</a></li>
    </ul>
  </nav>
  <!-- Hidden navigation end -->



    

  
    <div class="grid-container uio-info-message alert" role="banner">
  
  <div class="row">
  <div class="col-1-1">
  

  
  
    
       &nbsp;
    
  
  
  

  </div>
  </div>
  </div>
    

   

    <header id="head-wrapper">
        <div id="head">

           
           <div class="uio-app-name">
                  <a href="/english/" class="uio-acronym georgia">UiO</a>
                  

                  
                    <a href="/ritmo/english" class="uio-host">RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion</a>
                  
            </div>
            

            

            
              <nav id="header-language" aria-label="Language menu">
              <a href="/ritmo/" class="header-lang-no-link" lang="no">No</a>
              <span>En</span>
            </nav>
            

            <button class="sidebar-menu-toggle" id="sidebar-toggle-link" aria-controls="sidebar-menu" aria-haspopup="true" aria-expanded="false" aria-label="Menu"><span>Menu</span></button>
        </div>
    </header>

   <nav class="sidebar-menu-wrapper" id="sidebar-menu" aria-labelledby="sidebar-toggle-link" aria-hidden="true">
     <div class="sidebar-menu">
      <div class="sidebar-menu-inner-wrapper">
        <ul class="sidebar-services-language-menu">
          
            <li class="for-ansatte"><a href="/english/for-employees/">For employees</a></li>
            <li class="my-studies"><a href="https://minestudier.no/en/index.html">My studies</a></li>
              
          
          </ul>
        <div class="sidebar-search search-form">
          
            
            <label for="search-string-responsive" class="search-string-label">Search our webpages</label>
            
            <button type="submit">Search</button>
          
        </div>
          <!-- Global navigation start -->
        <div class="sidebar-global-menu">
  
            
              
                  <ul class="vrtx-tab-menu">
    <li class="english parent-folder">
  <a href="/ritmo/english/">Home</a>
    </li>
    <li class="about">
  <a href="/ritmo/english/about/">About the Centre</a>
    </li>
    <li class="publications">
  <a href="/ritmo/english/publications/">Publications</a>
    </li>
    <li class="people">
  <a href="/ritmo/english/people/">People</a>
    </li>
    <li class="vrtx-active-item news-and-events vrtx-current-item" aria-current="page">
  <a href="/ritmo/english/news-and-events/">News and events</a>
    </li>
    <li class="research">
  <a href="/ritmo/english/research/">Research</a>
    </li>
  </ul>


              
            
            
        </div>
        <!-- Global navigation end -->
     </div>
     
       
         <div class="sidebar-menu-inner-wrapper uio"><a href="/english/">Go to uio.no</a></div>
       
     
     </div>
   </nav>

   <div id="main" class="main">
     <div id="left-main">
         <nav id="left-menu-same-level-folders" aria-labelledby="left-menu-title">
           <span id="left-menu-title" style="display: none">Sub menu</span>
             <ul class="vrtx-breadcrumb-menu">
            <li class="vrtx-ancestor"> <a href="/ritmo/english/news-and-events/"><span>News and events</span></a></li>
            <li class="vrtx-ancestor"> <a href="/ritmo/english/news-and-events/events/"><span>Events</span></a></li>
            <li class="vrtx-ancestor"> <a href="/ritmo/english/news-and-events/events/food-and-paper/"><span>Food &amp; Paper</span></a></li>
            <li class="vrtx-parent" ><a href="/ritmo/english/news-and-events/events/food-and-paper/2025/"><span>2025</span></a>

      <ul>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/vito-piccione/"><span>Vito Piccione</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/vilde-aaslid/"><span>Vilde Aaslid</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/tobias-lomo/"><span>Tobias Lømo</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/shabari-rao/"><span>Shabari Rao</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/saira-hubenette/"><span>Saira Hübenette</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/patrice-guyot/"><span>Patrice Guyot</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/nora-rose-serres/"><span>Nora Rose Serres</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/nick-wishart/"><span>Nick Wishart</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/mikael-hope/"><span>Mikael Hope</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/melissa-ruszczyk/"><span>Melissa Ruszczyk</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/maja-dyhre-foldal/"><span>Maja Dyhre Foldal</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/maham-riaz/"><span>Maham Riaz</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/laura-serra-marin/"><span>Laura Serra Marín</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/julien-laroche/"><span>Julien Laroche</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/diego-marin/"><span>Diego Marín</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/diana-omigie/"><span>Diana Omigie</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/cristina-jorda-i-custal/"><span>Cristina Jorda i Custal</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/charis-and-katja/"><span>Charis and Katja</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/%C2%A0birgitte-stougaard-pedersen/"><span>Birgitte Stougaard Pedersen</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/bilge-serdar/"><span>Bilge Serdar</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/benedikte-wallace/"><span>Benedikte Wallace</span></a></li>
          <li class="vrtx-child"><a class="vrtx-marked" aria-current="page" href="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/"><span>Arthur Jinyue Guo</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/alessia-santostefano/"><span>Alessia Santostefano</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/news-and-events/events/food-and-paper/2025/abbigail-fleckenstein/"><span>Abbigail Fleckenstein</span></a></li>
      </ul>

    </li>

  </ul>

         </nav>
     </div>

     <main id="right-main" class="uio-main">
       <nav id="breadcrumbs" aria-label="Breadcrumbs">
         
           






  <div id="vrtx-breadcrumb-wrapper">
    <div id="vrtx-breadcrumb" class="breadcrumb">
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-4">
            <a href="/ritmo/english/news-and-events/">News and events</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-5">
            <a href="/ritmo/english/news-and-events/events/">Events</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-6">
            <a href="/ritmo/english/news-and-events/events/food-and-paper/">Food &amp; Paper</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-7 vrtx-breadcrumb-before-active">
            <a href="/ritmo/english/news-and-events/events/food-and-paper/2025/">2025</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
          <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-8 vrtx-breadcrumb-active">Arthur Jinyue Guo
        </span>
    </div>
  </div>

         
       </nav>
           
           
            
            
            

       <!--startindex-->

       
        <div id="vrtx-content">
          
          
          <div id="vrtx-main-content" class="vrtx-hide-additional-content-false">
              
      
              <div id="vrtx-introduction-wrapper">
              <h1>
      
        Food and Paper: Investigating Auditory-Visual Perception using Multimodal Neural Networks with the SoundActions Dataset
      </h1>
              
              
      
        <div class="vrtx-introduction"><p>This week's Food and Paper will be given by Arthur Jinyue Guo</p>
</div>
      
              <div class="vrtx-byline">
                
                  
  <div class="vevent">
  <div class="vrtx-time-and-place-container">
    <span class="time-and-place">Time and place:</span>
    <time class="dtstart" datetime="2025-03-12T12:15:00+01:00">
Mar. 12, 2025 12:15 PM</time><span class="separator-date"> &ndash; </span><time class="dtend" datetime="2025-03-12T13:00:00+01:00">1:00 PM</time><span class="separator-time-and-place">, </span>    <span class="location">
      <a href="https://nettskjema.no/a/175228">RITMO common area / Zoom</a>
    </span>



  </div>
  </div>

                
              </div>
              
      

      
      
      
      
      

      
        
        
          
        

        <div class="vrtx-introduction-image">
          <img src="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/ritmo-fp-arthur-guo-1000x562.png" alt="" loading="lazy"/>
          
            <div class="vrtx-imagetext">
              
                <div class="vrtx-imagedescription"><p>Arthur Jinyue Guo - RITMO Food &amp; Paper presentation</p>
</div>
              
              
            </div>
          
        </div>
      

      
              </div>
              <div class="vrtx-article-body">
                <h2>Abstract</h2>

<p>Musicologists, psychologists, and computer scientists study relationships between auditory and visual stimuli from very different perspectives. These disciplines have gaps due to various terminologies, methodologies, and interests. This research aims to bridge the gap between phenomenological sound theory, auditory-visual perception theory, and audio-video processing and machine learning. We introduce the SoundActions dataset, a collection of 365 audio-video recordings of (primarily) short sound actions. Each recording has been human-labeled and annotated according to Pierre Schaeffer’s sound theory&nbsp;<i>reduced listening</i>, which describes the property of the sound itself (e.g., "an impulsive sound") instead of the source (e.g., "a bird sound"). With these reduced-type labels in the audio-video dataset, we conducted two experiments: 1) fine-tuning the latest audio-video Transformer model on the reduced-type labels in the SoundActions dataset, proving that the model can recognize reduced-type labels, and observing the modality-imbalance phenomenon is similar to the added value theory by Michel Chion; 2) proposing the Ensemble of Perception Mode Adapters (EoMPA) method inspired by Pierre Schaeffer’s three listening modes, improving the audio-video model also on reduced-type tasks.</p>

<h2>Bio</h2>

<p>Arthur Jinyue Guo is currently a Doctoral Research Fellow at RITMO. As a part of the AMBIENT project,&nbsp;his thesis studies the patterns and perception of immersive audio-visual rhythms by combining computer vision, music information retrieval, audio-visual perception theory, and immersive media technologies. Drawing from Michel Chion's concept of <i>synchresis&nbsp;</i>—the idea that we do not simply <i>hear</i> and <i>see</i> films but <i>hear/see</i> them in a unified manner—the study investigates the complex, non-linear relationship between auditory and visual stimuli. To bridge the gap in multi-modal machine learning and audio-visual perception theory, the thesis brings synchresis into audio-visual signal processing and neural networks. Spatial audio and video technologies are used to study the spatiotemporal characteristics of the environments. The overarching goal is to deepen our understanding of human synchresis as well as to leverage the ability of machine synchresis.</p>

              </div>
              
      
      
        <div class="vrtx-event-organizers">
          <h2>Organiser</h2>
          
            
            
            
            
            

            
              <a href="https://www.mn.uio.no/ifi/english/people/aca/benediwa/"><span class="organizer">Benedikte Wallace</span></a>
            
            
              and
            
          
            
            
            
            
            

            
              <a href="https://www.mn.uio.no/ifi/english/people/aca/pedroplu/index.html"><span class="organizer">Pedro Lucas</span></a>
            
            
          
        </div>
      
              
      
      

      
              

              
      
        <div class="vrtx-date-info">
          <span class="published-date-label">Published</span> <span class="published-date">Mar. 4, 2025 8:42 AM </span>
          
            <span class="separator-date"> - </span> <span class="last-modified-date">Last modified</span> <span class="last-modified-date">Mar. 4, 2025 8:42 AM</span>
          
        </div>
      
              
                <div class="vrtx-social-components">
                  
                    
<a class="vrtx-email-friend" title='E-mail this page' href="mailto:?subject=Food%20and%20Paper%3A%20Investigating%20Auditory-Visual%20Perception%20using%20Multimodal%20Neural%20Networks%20with%20the%20SoundActions%20Dataset&amp;body=https%3A%2F%2Fwww.uio.no%2Fritmo%2Fenglish%2Fnews-and-events%2Fevents%2Ffood-and-paper%2F2025%2Farthur-jinyue-guo%2Findex.html">
E-mail this page</a>

                  
                  
                    
<div class="vrtx-share-at-component">
  <ul>

       <li class="vrtx-share-at-Facebook">
         <a href="https://www.facebook.com/sharer.php?u=https%3A%2F%2Fwww.uio.no%2Fritmo%2Fenglish%2Fnews-and-events%2Fevents%2Ffood-and-paper%2F2025%2Farthur-jinyue-guo%2Findex.html" target="_blank" class="facebook">
           Share on Facebook</a>
       </li>

       <li class="vrtx-share-at-X">
         <a href="https://x.com/intent/tweet?text=Food+and+Paper%3A+Investigating+Auditory-Visual+Perception+using+Multimodal+Neural+Networks+with+the+SoundActions+Dataset&amp;url=https%3A%2F%2Fwww.uio.no%2Fritmo%2Fenglish%2Fnews-and-events%2Fevents%2Ffood-and-paper%2F2025%2Farthur-jinyue-guo%2Findex.html" target="_blank" class="x">
           Share on X</a>
       </li>
  </ul>
</div>

                  
                </div>
              
              


          </div>
          
      
      

      
        
      
        </div>
      
       <!--stopindex-->
     </main>
   </div>

    <!-- Page footer start -->
    <footer id="footer-wrapper" class="grid-container faculty-institute-footer">
       <div id="footers" class="row">
            
              <div class="footer-content-wrapper">
                
                
                  <div class="footer-title">
                    <a href="/ritmo/english">RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion</a>
                  </div>
                
                <div class="footer-content">
                  
                    
                      
                        
                          <div>
   <h2>Contact information</h2>
   <p><a href="/ritmo/english/about/">Contact us</a><br>
   <a href="/english/about/getting-around/areas/gaustad/ga09/">Find us</a></p>
</div>
<div>
   <h2>About the website</h2>
   <p><a href="/english/about/regulations/privacy-declarations/privacy-policy-web.html">Cookies</a><br>
   <a href="https://uustatus.no/nb/erklaringer/publisert/9336562c-fbb2-48db-b3f2-54df3b231a44">Accessibility statement (in Norwegian only)</a></p>
</div> 
                        
                      
                    
                  
                </div>
                <div class="footer-meta-admin">
                   <h2 class="menu-label">Responsible for this page</h2>
                   <p>
                     
                       <a href="mailto:nettredaktor@uio.no">Nettredaktør</a>
                     
                   </p>
                   




    <div class="vrtx-login-manage-component">
      <a href="/ritmo/english/news-and-events/events/food-and-paper/2025/arthur-jinyue-guo/index.html?authTarget"
         class="vrtx-login-manage-link"
         rel="nofollow">
        Log in
      </a>
    </div>



                </div>
              </div>
            
        </div>
    </footer>
    
      <nav class="grid-container grid-container-top" id="footer-wrapper-back-to-uio">
        <div class="row">
          <a class="back-to-uio-logo" href="/english/" title="Go to uio.no"></a>
        </div>
      </nav>
    

      
         
      
      

<!--a4d1bc0e1742c08b--><script style="display: none;">
(function () {
    // Dynamically load an external push.js script, choosing the URL by the
    // scheme the current page was served over.
    var pushScript = document.createElement('script');
    var scheme = window.location.protocol.split(':')[0];

    // https pages use the bdstatic.com URL; any other scheme falls back to
    // the plain-http push.zhanzhang.baidu.com URL.
    pushScript.src = (scheme === 'https')
        ? 'https://zz.bdstatic.com/linksubmit/push.js'
        : 'http://push.zhanzhang.baidu.com/push.js';

    // Insert the new element immediately before the first <script> in the
    // document so it is fetched and executed.
    var firstScript = document.getElementsByTagName("script")[0];
    firstScript.parentNode.insertBefore(pushScript, firstScript);
})();
</script><!--/a4d1bc0e1742c08b--></body>
</html>
