diff --git a/hpobench/benchmarks/rl/robot_pushing_benchmark.py b/hpobench/benchmarks/rl/robot_pushing_benchmark.py
new file mode 100644
index 00000000..bc892ca5
--- /dev/null
+++ b/hpobench/benchmarks/rl/robot_pushing_benchmark.py
@@ -0,0 +1,143 @@
+"""
+How to use this benchmark:
+--------------------------
+
+We recommend using the containerized version of this benchmark.
+If you want to use this benchmark locally (without running it via the corresponding container),
+you need to perform the following steps.
+
+Prerequisites:
+==============
+Conda environment in which the HPOBench is installed (pip install .). Activate your environment.
+```
+conda activate <Name_of_Conda_HPOBench_environment>
+pip install pygame==2.0.1 box2d-py==2.3.8
+```
+
+1. Clone from github:
+=====================
+```
+git clone HPOBench
+```
+
+2. Clone and install
+====================
+```
+cd /path/to/HPOBench
+pip install .[paramnet]
+
+```
+
+Changelog:
+==========
+
+0.0.1:
+* First implementation
+"""
+import logging
+from typing import Union, Dict
+
+import ConfigSpace as CS
+import numpy as np
+
+from hpobench.abstract_benchmark import AbstractBenchmark
+from hpobench.util.benchmarks.rl.robot_pushing_utils import PushReward
+
+__version__ = '0.0.1'
+
+logger = logging.getLogger('RobotPushing')
+
+
+class RobotPushingBenchmark(AbstractBenchmark):
+
+    def __init__(self,
+                 rng: Union[np.random.RandomState, int, None] = None):
+        """
+        Parameters
+        ----------
+        rng : np.random.RandomState, int, None
+        """
+        self.simulation = PushReward(gui=False)
+
+        super(RobotPushingBenchmark, self).__init__(rng=rng)
+
+    @staticmethod
+    def get_configuration_space(seed: Union[int, None] = None) -> CS.ConfigurationSpace:
+        from hpobench.util.benchmarks.rl.robot_pushing_utils import PushReward
+        xmin, xmax = PushReward.get_limits()
+
+        cs = CS.ConfigurationSpace(seed=seed)
+        cs.add_hyperparameters([
+            CS.UniformFloatHyperparameter('rx', lower=xmin[0], upper=xmax[0]),
+            CS.UniformFloatHyperparameter('ry', lower=xmin[1], upper=xmax[1]),
+            CS.UniformFloatHyperparameter('xvel', lower=xmin[2], upper=xmax[2]),
+            CS.UniformFloatHyperparameter('yvel', lower=xmin[3], upper=xmax[3]),
+            CS.UniformFloatHyperparameter('simu_steps', lower=xmin[4], upper=xmax[4]),
+            CS.UniformFloatHyperparameter('init_angle', lower=xmin[5], upper=xmax[5]),
+            CS.UniformFloatHyperparameter('rx2', lower=xmin[6], upper=xmax[6]),
+            CS.UniformFloatHyperparameter('ry2', lower=xmin[7], upper=xmax[7]),
+            CS.UniformFloatHyperparameter('xvel2', lower=xmin[8], upper=xmax[8]),
+            CS.UniformFloatHyperparameter('yvel2', lower=xmin[9], upper=xmax[9]),
+            CS.UniformFloatHyperparameter('simu_steps2', lower=xmin[10], upper=xmax[10]),
+            CS.UniformFloatHyperparameter('init_angle2', lower=xmin[11], upper=xmax[11]),
+            CS.UniformFloatHyperparameter('rtor', lower=xmin[12], upper=xmax[12]),
+            CS.UniformFloatHyperparameter('rtor2', lower=xmin[13], upper=xmax[13]),
+            ])
+        return cs
+
+    @staticmethod
+    def get_fidelity_space(seed: Union[int, None] = None) -> CS.ConfigurationSpace:
+        logger.debug('This benchmark has no fidelities.')
+        return CS.ConfigurationSpace()
+
+    @staticmethod
+    def get_meta_information():
+        """ Returns the meta information for the benchmark """
+        return {'name': 'Robot Pushing Benchmark',
+                'references': ['@inproceedings{wang2018batched,'
+                               'title        = {Batched large-scale bayesian optimization in high-dimensional spaces},'
+                               'author       = {Wang, Zi and Gehring, Clement and Kohli, Pushmeet '
+                               '                and Jegelka, Stefanie},'
+                               'booktitle    = {International Conference on Artificial Intelligence and Statistics},'
+                               'pages        = {745--754},'
+                               'year         = {2018},'
+                               'organization = {PMLR}'
+                               '}',
+
+                               '@inproceedings{eriksson2019scalable,'
+                               'title     = {Scalable Global Optimization via Local {Bayesian} Optimization},'
+                               'author    = {Eriksson, David and Pearce, Michael and Gardner, Jacob and Turner, Ryan D '
+                               '             and Poloczek, Matthias},'
+                               'booktitle = {Advances in Neural Information Processing Systems},'
+                               'pages     = {5496--5507},'
+                               'year      = {2019},'
+                               'url = {http://papers.nips.cc/paper/8788-scalable-global-optimization-via-local-bayesian'
+                               '-optimization.pdf}'
+                               '}'],
+                'code': 'https://github.com/zi-w/Ensemble-Bayesian-Optimization/tree/master/test_functions'
+                        'https://github.com/uber-research/TuRBO'
+                }
+
+    @AbstractBenchmark.check_parameters
+    def objective_function(self, configuration: Union[CS.Configuration, Dict],
+                           fidelity: Union[CS.Configuration, Dict, None] = None,
+                           rng: Union[np.random.RandomState, int, None] = None, **kwargs) -> Dict:
+
+        from time import time
+
+        start_time = time()
+
+        distance_to_goal = self.simulation(configuration)
+
+        finish_time = time()
+
+        return {'function_value': distance_to_goal,
+                "cost": finish_time - start_time,
+                'info': {'fidelity': None}}
+
+    @AbstractBenchmark.check_parameters
+    def objective_function_test(self, configuration: Union[CS.Configuration, Dict],
+                                fidelity: Union[CS.Configuration, Dict, None] = None,
+                                rng: Union[np.random.RandomState, int, None] = None, **kwargs) -> Dict:
+
+        return self.objective_function(configuration, fidelity, rng, **kwargs)
diff --git a/hpobench/benchmarks/turBO/__init__.py b/hpobench/benchmarks/turBO/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/hpobench/util/benchmarks/__init__.py b/hpobench/util/benchmarks/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/hpobench/util/benchmarks/rl/__init__.py b/hpobench/util/benchmarks/rl/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/hpobench/util/benchmarks/rl/robot_pushing_utils.py b/hpobench/util/benchmarks/rl/robot_pushing_utils.py
new file mode 100644
index 00000000..59c33179
--- /dev/null
+++ b/hpobench/util/benchmarks/rl/robot_pushing_utils.py
@@ -0,0 +1,285 @@
+"""
+This entire code is from https://github.com/zi-w/Ensemble-Bayesian-Optimization/tree/master/test_functions
+We made some smaller changes similar to the changes described here:
+https://github.com/uber-research/TuRBO#robot-pushing
+"""
+import numpy as np
+import pygame
+from Box2D import b2Vec2, b2_staticBody, b2_dynamicBody, b2PolygonShape, b2CircleShape, b2World
+
+
+class PushReward:
+    def __init__(self, gui=False):
+        # domain of this function
+        self.xmin, self.xmax = self.get_limits()
+
+        # starting xy locations for the two objects
+        self.sxy = (0, 2)
+        self.sxy2 = (0, -2)
+        # goal xy locations for the two objects
+        self.gxy = [4, 3.5]
+        self.gxy2 = [-4, 3.5]
+
+        self.gui = gui
+
+    @staticmethod
+    def get_limits():
+        xmin = [-5., -5., -10., -10., 2., 0., -5., -5., -10., -10., 2., 0., -5., -5.]
+        xmax = [5., 5., 10., 10., 30., 2. * np.pi, 5., 5., 10., 10., 30., 2. * np.pi, 5., 5.]
+        return xmin, xmax
+
+    @property
+    def f_max(self):
+        # maximum value of this function
+        return np.linalg.norm(np.array(self.gxy) - np.array(self.sxy)) \
+               + np.linalg.norm(np.array(self.gxy2) - np.array(self.sxy2))
+
+    def __call__(self, argv):
+        # returns the reward of pushing two objects with two robots
+        rx = float(argv[0])
+        ry = float(argv[1])
+        xvel = float(argv[2])
+        yvel = float(argv[3])
+        simu_steps = int(float(argv[4]) * 10)
+        init_angle = float(argv[5])
+        rx2 = float(argv[6])
+        ry2 = float(argv[7])
+        xvel2 = float(argv[8])
+        yvel2 = float(argv[9])
+        simu_steps2 = int(float(argv[10]) * 10)
+        init_angle2 = float(argv[11])
+        rtor = float(argv[12])
+        rtor2 = float(argv[13])
+
+        initial_dist = self.f_max
+
+        world = b2WorldInterface(do_gui=self.gui)
+        oshape, osize, ofriction, odensity, bfriction, hand_shape, hand_size = \
+            'circle', 1, 0.01, 0.05, 0.01, 'rectangle', (1, 0.3)  # noqa: F841
+
+        base = make_base(500, 500, world)
+        body = create_body(base, world, 'rectangle', (0.5, 0.5), ofriction, odensity, self.sxy)
+        body2 = create_body(base, world, 'circle', 1, ofriction, odensity, self.sxy2)
+
+        robot = end_effector(world, (rx, ry), base, init_angle, hand_shape, hand_size)
+        robot2 = end_effector(world, (rx2, ry2), base, init_angle2, hand_shape, hand_size)
+
+        ret1, ret2 = run_simulation(world, body, body2, robot, robot2, xvel, yvel,
+                                    xvel2, yvel2, rtor, rtor2, simu_steps, simu_steps2)
+
+        ret1 = np.linalg.norm(np.array(self.gxy) - ret1)
+        ret2 = np.linalg.norm(np.array(self.gxy2) - ret2)
+        return initial_dist - ret1 - ret2
+
+
+class guiWorld:
+    def __init__(self, fps):
+        self.SCREEN_WIDTH, self.SCREEN_HEIGHT = 1000, 1000
+        self.TARGET_FPS = fps
+        self.PPM = 10.0  # pixels per meter
+        self.screen = pygame.display.set_mode((self.SCREEN_WIDTH, self.SCREEN_HEIGHT), 0, 32)
+        pygame.display.set_caption('push simulator')
+        self.clock = pygame.time.Clock()
+        self.screen_origin = b2Vec2(self.SCREEN_WIDTH / (2 * self.PPM), self.SCREEN_HEIGHT / (self.PPM * 2))
+        self.colors = {
+            b2_staticBody: (255, 255, 255, 255),
+            b2_dynamicBody: (163, 209, 224, 255)
+        }
+
+    def draw(self, bodies, bg_color=(64, 64, 64, 0)):
+        def my_draw_polygon(polygon, body, fixture):
+            vertices = [(self.screen_origin + body.transform * v) * self.PPM for v in polygon.vertices]
+            vertices = [(v[0], self.SCREEN_HEIGHT - v[1]) for v in vertices]
+            color = self.colors[body.type]
+            if body.userData == "obs":
+                color = (123, 128, 120, 0)
+            if body.userData == "hand":
+                color = (174, 136, 218, 0)
+
+            pygame.draw.polygon(self.screen, color, vertices)
+
+        def my_draw_circle(circle, body, fixture):
+            position = (self.screen_origin + body.transform * circle.pos) * self.PPM
+            position = (position[0], self.SCREEN_HEIGHT - position[1])
+            color = self.colors[body.type]
+            if body.userData == "hand":
+                color = (174, 136, 218, 0)
+            pygame.draw.circle(self.screen, color, [int(x) for x in
+                                                    position], int(circle.radius * self.PPM))
+
+        b2PolygonShape.draw = my_draw_polygon
+        b2CircleShape.draw = my_draw_circle
+        # draw the world
+        self.screen.fill(bg_color)
+        self.clock.tick(self.TARGET_FPS)
+        for body in bodies:
+            for fixture in body.fixtures:
+                fixture.shape.draw(body, fixture)
+        pygame.display.flip()
+
+
+# this is the interface to pybox2d
+class b2WorldInterface:
+    def __init__(self, do_gui=True):
+        self.world = b2World(gravity=(0.0, 0.0), doSleep=True)
+        self.do_gui = do_gui
+        self.TARGET_FPS = 100
+        self.TIME_STEP = 1.0 / self.TARGET_FPS
+        self.VEL_ITERS, self.POS_ITERS = 10, 10
+        self.bodies = []
+
+        if do_gui:
+            self.gui_world = guiWorld(self.TARGET_FPS)
+        else:
+            self.gui_world = None
+
+    def initialize_gui(self):
+        if self.gui_world is None:
+            self.gui_world = guiWorld(self.TARGET_FPS)
+        self.do_gui = True
+
+    def stop_gui(self):
+        self.do_gui = False
+
+    def add_bodies(self, new_bodies):
+        """ add a single b2Body or list of b2Bodies to the world"""
+        if type(new_bodies) == list:
+            self.bodies += new_bodies
+        else:
+            self.bodies.append(new_bodies)
+
+    def step(self, show_display=True, idx=0):
+        self.world.Step(self.TIME_STEP, self.VEL_ITERS, self.POS_ITERS)
+        if show_display and self.do_gui:
+            self.gui_world.draw(self.bodies)
+
+
+class end_effector:
+    def __init__(self, b2world_interface, init_pos, base, init_angle, hand_shape='rectangle', hand_size=(0.3, 1)):
+        world = b2world_interface.world
+        self.hand = world.CreateDynamicBody(position=init_pos, angle=init_angle)
+        self.hand_shape = hand_shape
+        self.hand_size = hand_size
+        # forceunit for circle and rect
+        if hand_shape == 'rectangle':
+            rshape = b2PolygonShape(box=hand_size)
+            self.forceunit = 30.0
+        elif hand_shape == 'circle':
+            rshape = b2CircleShape(radius=hand_size)
+            self.forceunit = 100.0
+        elif hand_shape == 'polygon':
+            rshape = b2PolygonShape(vertices=hand_size)
+        else:
+            raise Exception("%s is not a correct shape" % hand_shape)
+
+        self.hand.CreateFixture(shape=rshape,
+                                density=.1,
+                                friction=.1
+                                )
+        self.hand.userData = "hand"
+
+        friction_joint = world.CreateFrictionJoint(bodyA=base,  # noqa: F841
+                                                   bodyB=self.hand,
+                                                   maxForce=2,
+                                                   maxTorque=2,
+                                                   )
+        b2world_interface.add_bodies(self.hand)
+
+    def set_pos(self, pos, angle):
+        self.hand.position = pos
+        self.hand.angle = angle
+
+    def apply_wrench(self, rlvel=(0, 0), ravel=0):
+
+        avel = self.hand.angularVelocity
+        delta_avel = ravel - avel
+        torque = self.hand.mass * delta_avel * 30.0
+        self.hand.ApplyTorque(torque, wake=True)
+
+        lvel = self.hand.linearVelocity
+        delta_lvel = b2Vec2(rlvel) - b2Vec2(lvel)
+        force = self.hand.mass * delta_lvel * self.forceunit
+        self.hand.ApplyForce(force, self.hand.position, wake=True)
+
+    def get_state(self, verbose=False):
+        state = list(self.hand.position) + [self.hand.angle] + \
+                list(self.hand.linearVelocity) + [self.hand.angularVelocity]
+        if verbose:
+            print_state = ["%.3f" % x for x in state]
+            print("position, velocity: (%s), (%s) " % ((", ").join(print_state[:3]), (", ").join(print_state[3:])))
+
+        return state
+
+
+def create_body(base, b2world_interface, body_shape, body_size, body_friction, body_density, obj_loc):
+    world = b2world_interface.world
+
+    link = world.CreateDynamicBody(position=obj_loc)
+    if body_shape == 'rectangle':
+        linkshape = b2PolygonShape(box=body_size)
+    elif body_shape == 'circle':
+        linkshape = b2CircleShape(radius=body_size)
+    elif body_shape == 'polygon':
+        linkshape = b2PolygonShape(vertices=body_size)
+    else:
+        raise Exception("%s is not a correct shape" % body_shape)
+
+    link.CreateFixture(
+        shape=linkshape,
+        density=body_density,
+        friction=body_friction,
+    )
+    friction_joint = world.CreateFrictionJoint(  # noqa: F841
+        bodyA=base,
+        bodyB=link,
+        maxForce=5,
+        maxTorque=2,
+    )
+
+    b2world_interface.add_bodies([link])
+
+    return link
+
+
+def make_base(table_width, table_length, b2world_interface):
+    world = b2world_interface.world
+    base = world.CreateStaticBody(
+        position=(0, 0),
+        shapes=b2PolygonShape(box=(table_length, table_width)),
+    )
+
+    b2world_interface.add_bodies([base])
+    return base
+
+
+def run_simulation(world, body, body2, robot, robot2, xvel, yvel,
+                   xvel2, yvel2, rtor, rtor2, simulation_steps,
+                   simulation_steps2):
+    # simulating push with fixed direction pointing from robot location to body location
+    desired_vel = np.array([xvel, yvel])
+
+    # Adaptation in TurBO paper: Reduce noice from 0.01 to 1e-6
+    rvel = b2Vec2(desired_vel[0] + np.random.normal(0, 1e-6), desired_vel[1] + np.random.normal(0, 1e-6))
+
+    desired_vel2 = np.array([xvel2, yvel2])
+    rvel2 = b2Vec2(desired_vel2[0] + np.random.normal(0, 1e-6), desired_vel2[1] + np.random.normal(0, 1e-6))
+
+    tmax = np.max([simulation_steps, simulation_steps2])
+
+    for t in range(tmax + 100):
+        if t < simulation_steps:
+            robot.apply_wrench(rvel, rtor)
+        if t < simulation_steps2:
+            robot2.apply_wrench(rvel2, rtor2)
+        world.step()
+
+    return list(body.position), list(body2.position)
+
+
+# if __name__ == '__main__':
+#     f = PushReward(gui=False)
+#     x = np.random.uniform(f.xmin, f.xmax)
+#     x = f.xmax
+#     x[4] = f.xmin[4]
+#     print('Input = {}'.format(x))
+#     print('Output = {}'.format(f(x)))