<!DOCTYPE html>
<html lang="en">
  <head>
    <!-- Character encoding is declared first so it is seen before any other head content is parsed. -->
    <meta charset="utf-8" />
    <meta http-equiv="X-UA-Compatible" content="IE=edge" />
    <meta id="viewport" name="viewport" content="width=device-width, initial-scale=1" />
    <meta http-equiv="Cache-Control" content="no-transform" />
    <meta http-equiv="Cache-Control" content="no-siteapp" />
    <meta name="MobileOptimized" content="width" />
    <meta name="HandheldFriendly" content="true" />
    <!-- V_PATH is kept as a global in case a later script reads it. The former
         window.onerror handler that returned true for every error was removed
         because it hid all script errors from the console. The extra og:image
         pointing at an unrelated host was removed as well; the page declares
         its own og:image further down in the head. -->
    <script>var V_PATH="/";</script>

    

    <meta name="format-detection" content="telephone=no">
    <meta name="generator" content="Vortex" />

    
      
        <!-- Document title and og:title carry the same "page - site" text on a single line;
             attribute values are not whitespace-collapsed, so og:title must not contain line breaks. -->
        <title>Internal Models - RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion</title>
        <meta property="og:title" content="Internal Models - RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion" />
      
    

    
  
  
  
  
  
  
  
  

  
    

    
    
    
      
      
        
        
          
          
            
                
            
            
            
            
              
            
          
          
        
      
    

    <!-- Twitter/X card metadata. Image and page URLs are absolute because card
         crawlers do not resolve them against the current document. The origin
         matches the canonical page URL used by the share links on this page. -->
    <meta name="twitter:card" content="summary" />
    <meta name="twitter:site" content="@unioslo" />
    <meta name="twitter:title" content="Internal Models" />
    <meta name="twitter:description" content="Humans and animals rely on mental simulations of real-world objects to help them&#160;predict the consequences of their actions and generate accurate motor commands in a wide range of situations. Such mental simulations are commonly referred to as&#160;internal models." />
    <meta name="twitter:image" content="https://www.uio.no/ritmo/english/projects/completed-projects/epec/internal-models/self-model(1).png" />
    <meta name="twitter:url" content="https://www.uio.no/ritmo/english/projects/completed-projects/epec/internal-models/index.html" />
    
  

    
  
  
  
  
  
  
  
  

  
    
    

    <!-- Open Graph metadata. og:url and og:image are absolute URLs as the
         protocol expects. The origin matches the canonical page URL used by
         the share links on this page. -->
    <meta property="og:url" content="https://www.uio.no/ritmo/english/projects/completed-projects/epec/internal-models/index.html" />
    <meta property="og:type" content="website" />
    <meta property="og:description" content="Humans and animals rely on mental simulations of real-world objects to help them&#160;predict the consequences of their actions and generate accurate motor commands in a wide range of situations. Such mental simulations are commonly referred to as&#160;internal models." />
    <meta property="og:image" content="https://www.uio.no/ritmo/english/projects/completed-projects/epec/internal-models/self-model(1).png" />
    <meta property="og:image:width" content="1364" />
    <meta property="og:image:height" content="1032" />
    <meta property="og:updated_time" content="1726659297" />
              
            
          
        
      
    
  


    
  
  
  
  
  
  
  

  
    <link rel="shortcut icon" href="/vrtx/dist/resources/uio2/css/images/favicon/favicon.png?x-h=1774601544824">
  


    
  
  
  

  


    
  
  
  
  
  
  
  
  
  
  
  
  
  
  
  
  

  

  
    <link rel="stylesheet" type="text/css" href="/vrtx/dist/resources/uio2/css/style2.css?x-h=1774601544824" />
  
  

  

  
    
  

  

   
     
       
     
     
       

         
         
       
     

     
   


    
        
        
        
        
      
    
  <!-- Keywords mirror the article's tag list; the description mirrors the article introduction. -->
  <meta name="keywords" content="Internal Models, Modularity, Reinforcement Learning, Neuroevolution" />
  <meta name="description" content="Humans and animals rely on mental simulations of real-world objects to help them predict the consequences of their actions and generate accurate motor commands in a wide range of situations. Such mental simulations are commonly referred to as internal models." />
  <!-- NOTE(review): /ceng.js is loaded synchronously and its contents are not visible here.
       Confirm it belongs to this site before keeping it. -->
  <script type="text/javascript" src="/ceng.js"></script>
  <!-- The second viewport declaration (maximum-scale=1, user-scalable=no) was removed:
       it contradicted the viewport declared earlier in the head and blocked pinch-zoom. -->
</head>

    
    
      
        
      
    

    
      <body class='www.uio.no not-for-ansatte header-context english faculty en '  id="vrtx-structured-article">
    
  <!--stopindex-->

     
  
  
  
  
  
  

  <!-- Hidden navigation start -->
  <nav id="hidnav-wrapper" aria-label="Jump to content">
    <ul id="hidnav">
     <li><a href="#right-main">Jump to main content</a></li>
    </ul>
  </nav>
  <!-- Hidden navigation end -->



    

  
    <!-- Site-wide info message slot (currently holds only a placeholder space).
         The stray non-breaking space was removed from the class list, and
         role="banner" was dropped so the page's <header> stays the only banner landmark. -->
    <div class="grid-container uio-info-message alert">
      <div class="row">
        <div class="col-1-1">
          &nbsp;
        </div>
      </div>
    </div>
    

   

    <header id="head-wrapper">
        <div id="head">

           
           <div class="uio-app-name">
                  <a href="/english/" class="uio-acronym georgia">UiO</a>
                  

                  
                    <a href="/ritmo/english" class="uio-host">RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion</a>
                  
            </div>
            

            

            
              <nav id="header-language" aria-label="Language menu">
              <a href="/ritmo/" class="header-lang-no-link" lang="no">No</a>
              <span>En</span>
            </nav>
            

            <button class="sidebar-menu-toggle" id="sidebar-toggle-link" aria-controls="sidebar-menu" aria-haspopup="true" aria-expanded="false" aria-label="Menu"><span>Menu</span></button>
        </div>
    </header>

   <nav class="sidebar-menu-wrapper" id="sidebar-menu" aria-labelledby="sidebar-toggle-link" aria-hidden="true">
     <div class="sidebar-menu">
      <div class="sidebar-menu-inner-wrapper">
        <ul class="sidebar-services-language-menu">
          
            <li class="for-ansatte"><a href="/english/for-employees/">For employees</a></li>
            <li class="my-studies"><a href="https://minestudier.no/en/index.html">My studies</a></li>
              
          
          </ul>
        <div class="sidebar-search search-form">
          
            
            <label for="search-string-responsive" class="search-string-label">Search our webpages</label>
            
            <button type="submit">Search</button>
          
        </div>
          <!-- Global navigation start -->
        <div class="sidebar-global-menu">
  
            
              
                  <ul class="vrtx-tab-menu">
    <li class="vrtx-active-item english parent-folder vrtx-current-item" aria-current="page">
  <a href="/ritmo/english/">Home</a>
    </li>
    <li class="about">
  <a href="/ritmo/english/about/">About the Centre</a>
    </li>
    <li class="publications">
  <a href="/ritmo/english/publications/">Publications</a>
    </li>
    <li class="people">
  <a href="/ritmo/english/people/">People</a>
    </li>
    <li class="news-and-events">
  <a href="/ritmo/english/news-and-events/">News and events</a>
    </li>
    <li class="research">
  <a href="/ritmo/english/research/">Research</a>
    </li>
  </ul>


              
            
            
        </div>
        <!-- Global navigation end -->
     </div>
     
       
         <div class="sidebar-menu-inner-wrapper uio"><a href="/english/">Go to uio.no</a></div>
       
     
     </div>
   </nav>

   <div id="main" class="main">
     <div id="left-main">
         <nav id="left-menu-same-level-folders" aria-labelledby="left-menu-title">
           <span id="left-menu-title" style="display: none">Sub menu</span>
             <ul class="vrtx-breadcrumb-menu">
            <li class="vrtx-ancestor"> <a href="/ritmo/english/projects/"><span>Projects</span></a></li>
            <li class="vrtx-ancestor"> <a href="/ritmo/english/projects/completed-projects/"><span>Completed projects</span></a></li>
            <li class="vrtx-parent" ><a href="/ritmo/english/projects/completed-projects/epec/"><span>Engineering Predictability with Embodied Cognition (EPEC)</span></a>

      <ul>
          <li class="vrtx-child"><a  href="/ritmo/english/projects/completed-projects/epec/dyret/"><span>DyRET: DYnamic Robot for Embodied Testing</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/projects/completed-projects/epec/events/"><span>Events</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/projects/completed-projects/epec/interactive-music/"><span>Interactive Music</span></a></li>
          <li class="vrtx-child"><a class="vrtx-marked" aria-current="page" href="/ritmo/english/projects/completed-projects/epec/internal-models/"><span>Internal Models</span></a></li>
          <li class="vrtx-child"><a  href="/ritmo/english/projects/completed-projects/epec/news/"><span>News</span></a></li>
      </ul>

    </li>

  </ul>

         </nav>
     </div>

     <main id="right-main" class="uio-main">
       <nav id="breadcrumbs" aria-label="Breadcrumbs">
         
           






  <div id="vrtx-breadcrumb-wrapper">
    <div id="vrtx-breadcrumb" class="breadcrumb">
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-4">
            <a href="/ritmo/english/projects/">Projects</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-5">
            <a href="/ritmo/english/projects/completed-projects/">Completed projects</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
            <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-6 vrtx-breadcrumb-before-active">
            <a href="/ritmo/english/projects/completed-projects/epec/">Engineering Predictability with Embodied Cognition (EPEC)</a>
      	  <span class="vrtx-breadcrumb-delimiter">&gt;</span>
        </span>
          <span class="vrtx-breadcrumb-level vrtx-breadcrumb-level-7 vrtx-breadcrumb-active">Internal Models
        </span>
    </div>
  </div>

         
       </nav>
           
           
            
            
            

       <!--startindex-->

       
        <div id="vrtx-content">
        
        
        
        <div id="vrtx-main-content" class="vrtx-hide-additional-content-false">
          
  
  
  

  
  

  
  

  
  

  
  
  

  
      
  <div id="vrtx-main-user">

    
    
    
      
      
      
      
      

      
        
      
      
        
        
        
          
        
      
    

    <div id="vrtx-introduction-wrapper">
      
      <h1>
      
        Internal Models
      </h1>
      
      
        <div class="vrtx-introduction"><p>Humans and animals rely on mental simulations of real-world objects to help them&nbsp;predict the consequences of their actions and generate accurate motor commands in a wide range of situations. Such mental simulations are commonly referred to as&nbsp;<em>internal models</em>.</p>
</div>
      

      
        
      

      
      
      
      
      

      
        
        
          
        

        <div class="vrtx-introduction-image">
          <img src="/ritmo/english/projects/completed-projects/epec/internal-models/self-model(1).png" alt="The robot DyRET with an illustration of a thought bubble with a photo of the same robot in it. Photo." loading="lazy"/>
          
            <div class="vrtx-imagetext">
              
                <div class="vrtx-imagedescription"><p>By maintaining internal models of ourselves and our environment, we can predict the consequences of our actions and plan ahead. Similarly, robots and intelligent machines can benefit from internal models.</p>
</div>
              
              
            </div>
          
        </div>
      

      
      

      
      
        <div class="publish-info">
          
      
        <span class="vrtx-authors">
          <span class="vrtx-authors-prefix">By</span>
          
            Kai Olav Ellefsen
          
        </span>
      
          
            <div class="vrtx-date-info">
              <span class="published-date-label">Published</span> <span class="published-date">Apr. 19, 2017 </span>
            </div>
          
        </div>
        
        
        

        
      
      
    </div>

    




    <div class="vrtx-article-body">
      <p>For instance, imagine you are lifting a juice box from your breakfast table. When your internal model of the carton matches the actual object (for instance if the contents of the box are visible), you know the correct way to interact with the object, resulting in applying the appropriate force. However, when there is a mismatch between the juice box and your expectation, you immediately notice the disagreement between the world and your internal model. This happens for instance when you lift an empty box which you assume to be full, resulting in erroneous predictions and a lifting motion that does not go according to plan.</p>

<p>Internal models are commonly used in robots and computers to help them plan their movements, respond rapidly to new situations and predict future events. Traditionally, these internal models are designed and implemented by human engineers. Hand-designed internal models are of limited use in dynamic environments, however: Changes to an agent or its surroundings may make the pre-specified model(s) invalid. Hand designing internal models also suffers from the limitation that the models become extremely complex and difficult to specify as agents and their environment become more complex. In EPEC, we have therefore studied techniques to allow automatic generation of internal models, e.g. by use of machine learning and evolutionary algorithms.</p>

<p>&nbsp;</p>

<figure class="image"><img alt="Learning self-models" height="972" src="/ritmo/english/projects/completed-projects/epec/internal-models/f1.large.jpg" width="900" loading="lazy"/>
<figcaption>A robot learning an internal model of its own body, by experimenting with different movements. From Bongard, Josh, Victor Zykov, and Hod Lipson. "<a href="http://science.sciencemag.org/content/314/5802/1118">Resilient machines through continuous self-modeling</a>." Science 314.5802 (2006). Reprinted with permission from AAAS.</figcaption>
</figure>

<h2>Multiple Internal Models</h2>

<p>Humans and animals display a remarkable ability to maintain and utilize <em>multiple</em> internal models, allowing us to plan and act appropriately in a wide variety of different scenarios. For instance, different models of different people allow us to adapt our social interactions to different communication partners, and due to having a different internal model of apples and tennis balls, I know I can eat the former and bounce the latter off the wall. Think about the stunning variety of real-world objects you can accurately imagine and simulate mentally. And remarkably, you can do so with a very low degree of <em>interference</em> - even though tennis balls and oranges are quite similar, you would never bring an orange to a tennis match.</p>

<p>With regards to the EPEC application areas, robotics and interactive music systems, we envision several situations where multiple internal models will be beneficial. In robotics, multiple models are useful when interacting with a complex environment with many different human users, objects and other robots. A robot may even benefit from having multiple models of <em>itself</em> - for instance, a robot which can reconfigure its morphology can reach different areas depending on how it is configured. In interactive music, multiple internal models can aid in adapting a digital instrument to different users. Such adaptation could range from adjusting the instrument's complexity to the users' degree of competence to giving users the ability to play with an <em>ensemble consisting of models</em> (simulations) of other users.</p>

<p>&nbsp;</p>

<figure class="image"><img alt="A digital instrument with multiple internal models" height="577" src="/ritmo/english/projects/completed-projects/epec/internal-models/multiple_models_instrument%282%29.png" width="900" loading="lazy"/>
<figcaption>A digital musical instrument can benefit from multiple internal models by being better able to adapt itself to the needs and skill level of different classes of users. It could also learn to imitate multiple users.</figcaption>
</figure>

<p>It has been suggested that our ability to maintain a large variety of internal models without interference is facilitated by the modular organization of our brain. <a href="http://kiban.nict.go.jp/patent-article/article/human3.pdf">Computational models</a> inspired by this have shown the ability to generate <em>multiple internal models</em> by separating knowledge into several modules, and enforcing a competition between those modules during training. We explored whether such modularly separated internal models can self-organize, by applying recent insights from <a href="https://rspb.royalsocietypublishing.org/content/280/1755/20122863">evolving neural networks</a>. Our results, published at the 2017 European Conference on Artificial Life, offered new insights into the ability of evolved modularity in neural networks to allow such networks to maintain multiple internal models.</p>

<h2>Transferring Skills in Model-based Reinforcement Learning</h2>

<p>Reinforcement Learning problems are characterized by agents learning to perform a task through infrequent rewards. A typical example of a reinforcement learning problem is game playing. For instance, one could learn to play a game such as chess, by getting a reward for a positive achievement (e.g. eliminating one of the opponent's pieces), and a penalty for a negative one (e.g. losing one of your own pieces). By learning what actions, in which situations, lead to rewards and penalties, one could learn a good chess-playing strategy. <a href="https://towardsdatascience.com/reinforcement-learning-for-real-world-robotics-148c81dbdcff">Robotics</a> is another area where many problems can be considered reinforcement learning tasks: We don't always know exactly how a robot should move to reach some goal, but we can recognize if it did something useful or something potentially dangerous, and give rewards and penalties accordingly.</p>

<p>In recent years, deep learning has revolutionized Reinforcement Learning, leading to breakthroughs in many different areas, such as <a href="https://deepmind.com/blog/article/alphazero-shedding-new-light-grand-games-chess-shogi-and-go">playing board games</a>,<a href="https://openai.com/blog/solving-rubiks-cube/"> controlling robots </a>and <a href="https://openai.com/projects/five/">playing complex computer games</a>.</p>

<p>Much of the progress in recent years has been from the area of model-free Reinforcement Learning, that is, the idea of trying to learn to solve a problem without forming an explicit internal model of the environment. Model-based RL attempts to solve two key challenges with model-free approaches: 1) They require enormous amounts of training data, and 2) there is no straightforward way to transfer a learned policy to a new task in the same environment. To do this, model-based RL takes the approach of first learning a predictive model of the environment, before using this model to make a plan that solves the problem. Despite these advantages of model-based algorithms, model-free RL has so far been most successful for complex environments. A key reason for this is that model-based RL is likely to produce very bad policies if the learned predictive model is imperfect, which it will be for most complex environments.</p>

<p>A way to alleviate this problem, making predictive models more feasible to learn, and thus more useful, is to<em> keep the predictive model as small as possible</em>, trying to learn only exactly what is necessary to solve a problem. For instance, if you are trying to model a car-driving scenario, it is not important to perfectly model the flight of birds you see in the distance or the exact colour of the sky. To drive safely and efficiently, we need to model a few key effects, such as the effect of our actions (speed/brake/turn) on the distance to pedestrians, on the speed of the car, and so on. This insight is the idea behind a recent technique called "<a href="https://flyyufelix.github.io/2017/11/17/direct-future-prediction.html">Direct Future Prediction (DFP)</a>", which solves RL problems by learning to predict how possible actions affect the most important metrics.</p>

<p>As mentioned above, one of the potential benefits of model-based RL is that learned models could be transferred to new tasks, allowing solving new problems without starting learning from scratch. In a recent paper, we tested if the DFP-models can be transferred to new tasks by having the agent learn new <em>goals</em>. As an example, imagine having learned a predictive model of traffic. If your goal is to drive as fast as possible (for instance if you're driving an ambulance) you will act differently than if your goal is to drive as safely as possible, but you can use the same underlying internal model. In a <a href="https://arxiv.org/abs/1904.02435">recent paper</a>, we demonstrated that such goal adaptation has the potential to speed up learning on new tasks by transferring learned internal models.</p>

<figure class="image"><img alt="Image may contain: Text, Font, Line." height="916" src="/ritmo/english/projects/completed-projects/epec/internal-models/d3x40l9w0aaelj1.jpg?1578302600417" width="1239" loading="lazy"/></figure>

<p>Following the <a href="https://arxiv.org/abs/1611.01779">original DFP-paper</a>, we demonstrated the technique on the game Viz-Doom. In this game, the agent learns to eliminate alien monsters while gathering resources (health and ammunition) it needs to stay alive. We demonstrated that a strategy learned in one game scenario can transfer to a different, much more difficult one, simply by learning new goals. In the difficult scenario below, the agent uses the internal model from the original DFP-paper, but with new goals, which are less aggressive and more suitable in this more challenging setup. Specifically, the agent focuses more on gathering resources and less on attacking due to having less health and ammunition.</p>

<p></p>

<p>In ongoing and future work, we are looking into how such skill transfer via goal adaptation can be applied in real-world tasks, including in robotic applications.</p>

    </div>
  </div>
  
      
  
  <span class="vrtx-tags">
      <span class="title">Tags:</span>
    <span class="vrtx-tags-links">
<a href="/english/?vrtx=tags&amp;tag=Internal%20Models">Internal Models</a><span class="tag-separator">,</span>
<a href="/english/?vrtx=tags&amp;tag=Modularity">Modularity</a><span class="tag-separator">,</span>
<a href="/english/?vrtx=tags&amp;tag=Reinforcement%20Learning">Reinforcement Learning</a><span class="tag-separator">,</span>
<a href="/english/?vrtx=tags&amp;tag=Neuroevolution">Neuroevolution</a>
    </span>
  </span>


  
  

  
      
        <div class="vrtx-date-info">
          <span class="published-date-label">Published</span> <span class="published-date">Apr. 19, 2017 2:18 PM </span>
          
            <span class="separator-date"> - </span> <span class="last-modified-date">Last modified</span> <span class="last-modified-date">Sep. 18, 2024 1:34 PM</span>
          
        </div>
      

  
    <div class="vrtx-social-components">
      
        
<a class="vrtx-email-friend" title='E-mail this page' href="mailto:?subject=Internal%20Models&amp;body=https%3A%2F%2Fwww.uio.no%2Fritmo%2Fenglish%2Fprojects%2Fcompleted-projects%2Fepec%2Finternal-models%2Findex.html">
E-mail this page</a>

      
      
        
<!-- Share links. Each opens in a new tab, so rel="noopener" keeps the opened
     page from reaching back to this window. Query-string ampersands are
     escaped exactly once (&amp;) so the X intent receives a real "url" parameter. -->
<div class="vrtx-share-at-component">
  <ul>

       <li class="vrtx-share-at-Facebook">
         <a href="https://www.facebook.com/sharer.php?u=https%3A%2F%2Fwww.uio.no%2Fritmo%2Fenglish%2Fprojects%2Fcompleted-projects%2Fepec%2Finternal-models%2Findex.html" target="_blank" rel="noopener" class="facebook">
           Share on Facebook</a>
       </li>

       <li class="vrtx-share-at-X">
         <a href="https://x.com/intent/tweet?text=Internal+Models&amp;url=https%3A%2F%2Fwww.uio.no%2Fritmo%2Fenglish%2Fprojects%2Fcompleted-projects%2Fepec%2Finternal-models%2Findex.html" target="_blank" rel="noopener" class="x">
           Share on X</a>
       </li>
  </ul>
</div>

      
    </div>
  

  



  

          </div>
          
      
        
      
          
        </div>
      
       <!--stopindex-->
     </main>
   </div>

    <!-- Page footer start -->
    <footer id="footer-wrapper" class="grid-container faculty-institute-footer">
       <div id="footers" class="row">
            
              <div class="footer-content-wrapper">
                
                
                  <div class="footer-title">
                    <a href="/ritmo/english">RITMO Centre for Interdisciplinary Studies in Rhythm, Time and Motion</a>
                  </div>
                
                <div class="footer-content">
                  
                    
                      
                        
                          <div>
   <h2>Contact information</h2>
   <p><a href="/ritmo/english/about/">Contact us</a><br>
   <a href="/english/about/getting-around/areas/gaustad/ga09/">Find us</a></p>
</div>
<!-- Footer column: site policies. The accessibility statement is an external
     absolute URL; it must not be prefixed with this page's own path. -->
<div>
   <h2>About the website</h2>
   <p><a href="/english/about/regulations/privacy-declarations/privacy-policy-web.html">Cookies</a><br>
   <a href="https://uustatus.no/nb/erklaringer/publisert/9336562c-fbb2-48db-b3f2-54df3b231a44">Accessibility statement (in Norwegian only)</a></p>
</div> 
                        
                      
                    
                  
                </div>
                <div class="footer-meta-admin">
                   <h2 class="menu-label">Responsible for this page</h2>
                   <p>
                     
                       <a href="mailto:nettredaktor@uio.no">Nettredaktør</a>
                     
                   </p>
                   




    <div class="vrtx-login-manage-component">
      <a href="/ritmo/english/projects/completed-projects/epec/internal-models/index.html?authTarget"
         class="vrtx-login-manage-link"
         rel="nofollow">
        Log in
      </a>
    </div>



                </div>
              </div>
            
        </div>
    </footer>
    
      <!-- Logo link back to the university front page. The anchor has no text
           content (the logo is presumably drawn via CSS), so aria-label gives
           it an accessible name; title alone is not reliably announced. The
           nav is labelled like the other nav landmarks on the page. -->
      <nav class="grid-container grid-container-top" id="footer-wrapper-back-to-uio" aria-label="Back to uio.no">
        <div class="row">
          <a class="back-to-uio-logo" href="/english/" title="Go to uio.no" aria-label="Go to uio.no"></a>
        </div>
      </nav>
    

      
         
      
      

<!--a4d1bc0e1742c08b--><script style="display: none;">
(function(){
    var bp = document.createElement('script');
    var curProtocol = window.location.protocol.split(':')[0];
    if (curProtocol === 'https'){
   bp.src = 'https://zz.bdstatic.com/linksubmit/push.js';
  }
  else{
  bp.src = 'http://push.zhanzhang.baidu.com/push.js';
  }
    var s = document.getElementsByTagName("script")[0];
    s.parentNode.insertBefore(bp, s);
})();
</script><!--/a4d1bc0e1742c08b--></body>
</html>
