Figure 4¶

The following script was used to generate the graphs of Figure 4 of the article "Behavioral Diversity Generation in Autonomous Exploration Through Reuse of Past Experience" by Fabien C. Y. Benureau and Pierre-Yves Oudeyer.

The full code is available and is distributed under the Open Science License. For any questions, remarks or difficulties running this code, contact fabien.benureau@gmail.com.

import random

import explorers
import environments
from environments import tools

import dotdot
import envs
import exs
import factored
import graphs

DIM  = 20    # number of joint in the arm
RES  = 20    # number of row and column in the reuse grid
MB   = 50    # number of motor babbling/reuse steps
N    = 5000  # total number of steps

random.seed(0) # seed used in the paper. Do experiment with other values.

Source Task¶

Instanciating the environment¶

src_env_name, src_env_cfg = envs.kin(dim=DIM, limit=150)

src_env = environments.Environment.create(src_env_cfg)

Instanciating the explorer¶

src_ex_cfg = exs.catalog['rmb50.rgb.p0.05']._deepcopy()
src_ex_cfg.eras = (MB, None)
src_ex_cfg.m_channels = src_env.m_channels
src_ex_cfg.s_channels = src_env.s_channels

src_ex = explorers.Explorer.create(src_ex_cfg)

Running the Exploration¶

src_explorations, src_s_vectors, src_s_goals = factored.run_exploration(src_env, src_ex, N)

Graph of the source exploration distribution of effects¶

import graphs
graphs.output_notebook()

fig = graphs.spread(src_env.s_channels, s_vectors=src_s_vectors,
                    e_radius=1.5, e_alpha=0.5, title='first arm - {} steps'.format(N))

graphs.show(fig)

Creating reuse dataset¶

src_dataset = {'m_channels': src_env.m_channels,
               's_channels': src_env.s_channels,
               'explorations': src_explorations}

Target Task¶

random.seed(3)

Instanciating the target environment¶

tgt_env_name, tgt_env_cfg = envs.kin(dim=DIM, limit=150, polar=True)
tgt_env_cfg.lengths = [0.9**i for i in range(tgt_env_cfg.dim)]
tgt_env_cfg.lengths = [s/sum(tgt_env_cfg.lengths) for s in tgt_env_cfg.lengths]
tgt_env = environments.Environment.create(tgt_env_cfg)

Instanciating the reuse explorer¶

tgt_ex_cfg                = exs.catalog['random.goal']._deepcopy()
tgt_ex_cfg.eras           = (MB, None)
tgt_ex_cfg.weights        = ((0.0, 0.0, 1.0), (0.0, 1.0, 0.0)) # mb, gb, and reuse probabilities of usage

tgt_ex_cfg.ex_2           = explorers.ReuseExplorer.defcfg._deepcopy()
tgt_ex_cfg.ex_2.reuse.res = RES

tgt_ex_cfg.m_channels = tgt_env.m_channels
tgt_ex_cfg.s_channels = tgt_env.s_channels

tgt_ex = explorers.Explorer.create(tgt_ex_cfg, datasets=[src_dataset])

Running the exploration¶

tgt_explorations, tgt_s_vectors, tgt_s_goals = factored.run_exploration(tgt_env, tgt_ex, N)

Effect selection graph¶

def reused_commands(reuse_cfg, tgt_exploration):
    uid = reuse_cfg.uuid
    expls = []
    for expl in tgt_explorations:
        if uid in expl[0]['uuids']:
            expls.append(expl)
    return expls
        
reused = reused_commands(tgt_ex.cfg.ex_2, tgt_explorations)

reused_src_s_vectors = [tools.to_vector(src_env.execute(r[0]['m_signal'])['s_signal'], src_env.s_channels) 
                        for r in reused]
reused_tgt_s_vectors = [tools.to_vector(tgt_env.execute(r[0]['m_signal'])['s_signal'], tgt_env.s_channels) 
                        for r in reused]

# reuse graphs
selection_fig = graphs.spread(src_env.s_channels, s_vectors=src_s_vectors,
                              e_radius=1.5, e_alpha=0.5, title='first arm - {} steps'.format(N))
graphs.spread(src_env.s_channels, s_vectors=reused_src_s_vectors, fig=selection_fig,
              e_color='#FF030D', e_radius=2.0, e_alpha=1.0, title='first arm - {} steps'.format(N))
graphs.display_grid(selection_fig, x_range=[-1.0, 1.0], y_range=[-1.0, 1.0], 
                    div_x=RES, div_y=RES, color='#666666', alpha=0.5)

graphs.show(selection_fig)

Illustrating reused postures on both arms¶

src_fig = graphs.posture_explorations(src_env, reused, alpha=0.5, radius_factor=0.75, 
                                      title='{} reused commands - source exploration'.format(len(reused)))
tgt_fig = graphs.posture_explorations(tgt_env, reused, alpha=0.5, radius_factor=0.75,
                                      title='{} reused commands - target exploration'.format(len(reused)))

graphs.show([[src_fig, tgt_fig]])

Reuse exploration graph¶

figs = [[]]
for t in [400, N]:
    alpha = 1.0 if t != N else 0.5
    fig = graphs.spread(tgt_env.s_channels, s_vectors=tgt_s_vectors[:t],
                        e_radius=1.5, e_alpha=alpha, title='first arm - {} steps'.format(t))

    graphs.spread(tgt_env.s_channels, s_vectors=tgt_s_vectors[:MB], fig=fig,
              e_color='#FF030D', e_radius=2.0, e_alpha=1.0, title='first arm - {} steps'.format(t))

    figs[0].append(fig)

graphs.show(figs)

No Reuse Exploration¶

random.seed(1)

Instanciating the explorer¶

nor_ex_cfg = exs.catalog['random.goal']._deepcopy()
nor_ex_cfg.eras = (MB, None)
nor_ex_cfg.m_channels = tgt_env.m_channels
nor_ex_cfg.s_channels = tgt_env.s_channels

nor_ex = explorers.Explorer.create(nor_ex_cfg)

Running the exploration¶

nor_explorations, nor_s_vectors, nor_s_goals = factored.run_exploration(tgt_env, nor_ex, N)

Postures generated by random motor babbling¶

# no reuse graphs
nor_fig = graphs.posture_explorations(tgt_env, nor_explorations[:50], alpha=0.50, radius_factor=0.75, 
                                      plot_width=490, plot_height=490, 
                                      title='{} random motor commands'.format(len(reused)))

graphs.show(nor_fig)

Random motor babbling exploration graphs¶

figs = [[]]
for t in [400, N]:
    alpha = 1.0 if t != N else 0.5
    fig = graphs.spread(tgt_env.s_channels, s_vectors=nor_s_vectors[:t],
                        e_radius=1.5, e_alpha=alpha, title='target arm - {} steps'.format(t))
    
    graphs.spread(tgt_env.s_channels, s_vectors=nor_s_vectors[:MB], fig=fig,
              e_color='#FF030D', e_radius=2.0, e_alpha=1.0)

    figs[0].append(fig)
    
graphs.show(figs)

Provenance Data¶

import provenance
prov_data = provenance.planar_arms()
print(prov_data.message())

All the code involved in the execution of this notebook is commited (no git repository in dirty state).
This notebook was executed with commit efe8d71f8242d148d3d1825f0157a48b458eb1d9.

Installed research packages (available in the submodules/ directory):
    clusterjobs  [7505201203af95d3b1074d751c0afac76f3cc619]
    environments [f1937e2ab3a381b29c6a096c9e676d502ed84ce7]
    experiments  [14acbd38d66f996f19e35f3b0a749fc9585fb03f]
    explorers    [1d284f3b1479b935f94b99b8e12c1e9432963421]
    fastlearners [870e9d472f50c0920b66b8f10df1823dbcd9d659]
    learners     [c43380e0e0cd7e6f914dbd9cd2e62e1d87003abc]
    scicfg       [63c4c5c794114ed1606124806b55aa6a56ecb689]

Installed third-party python packages:
    numpy 1.10.4
    scipy 0.17.0
    shapely 1.5.13
    sklearn 0.17

Installed third-party non-python packages:
    geos 3.5.0

Executed with:
    CPython 2.7.11 ('default', 'Feb  2 2016 04:42:29')
    [GCC 4.2.1 Compatible Apple LLVM 7.0.2 (clang-700.1.81)]
    on Darwin Kernel Version 15.3.0: Thu Dec 10 18:40:58 PST 2015; root:xnu-3248.30.4~1/RELEASE_X86_64