diff --git a/models/rllab_humanoid.xml b/models/rllab_humanoid.xml
new file mode 100644
index 000000000..33faa6754
--- /dev/null
+++ b/models/rllab_humanoid.xml
@@ -0,0 +1,135 @@
+<!-- MuJoCo model for the rllab simple humanoid (135 lines, elided) -->
diff --git a/models/rllab_swimmer.xml b/models/rllab_swimmer.xml
new file mode 100644
index 000000000..e321031f0
--- /dev/null
+++ b/models/rllab_swimmer.xml
@@ -0,0 +1,43 @@
+<!-- MuJoCo model for the rllab swimmer (43 lines, elided) -->
diff --git a/softlearning/environments/gym/__init__.py b/softlearning/environments/gym/__init__.py
index 00167fec9..ce57b31cd 100644
--- a/softlearning/environments/gym/__init__.py
+++ b/softlearning/environments/gym/__init__.py
@@ -61,6 +61,16 @@
         'entry_point': (f'{MUJOCO_ENVIRONMENTS_PATH}'
                         '.image_pusher_2d:BlindForkReacher2dEnv'),
     },
+    {
+        'id': 'Humanoid-RLLab-v0',
+        'entry_point': (f'{MUJOCO_ENVIRONMENTS_PATH}'
+                        '.rllab_humanoid:RLLabHumanoidEnv'),
+    },
+    {
+        'id': 'Swimmer-RLLab-v0',
+        'entry_point': (f'{MUJOCO_ENVIRONMENTS_PATH}'
+                        '.rllab_swimmer:RLLabSwimmerEnv'),
+    },
 )
 
 GENERAL_ENVIRONMENT_SPECS = (
diff --git a/softlearning/environments/gym/mujoco/rllab_humanoid.py b/softlearning/environments/gym/mujoco/rllab_humanoid.py
new file mode 100644
index 000000000..5d938a907
--- /dev/null
+++ b/softlearning/environments/gym/mujoco/rllab_humanoid.py
@@ -0,0 +1,82 @@
+import os.path as osp
+
+import numpy as np
+from gym.envs.mujoco.mujoco_env import MujocoEnv
+from serializable import Serializable
+
+from softlearning.misc.utils import PROJECT_PATH
+
+
+class RLLabHumanoidEnv(Serializable, MujocoEnv):
+    """Environment based on the HumanoidEnv from rllab.
+
+    https://github.com/rll/rllab/blob/master/rllab/envs/mujoco/simple_humanoid_env.py
+    """
+
+    MODEL_PATH = osp.abspath(
+        osp.join(PROJECT_PATH, 'models', 'rllab_humanoid.xml'))
+
+    def __init__(self,
+                 vel_deviation_cost_coeff=1e-2,
+                 alive_bonus=0.2,
+                 ctrl_cost_coeff=1e-3,
+                 impact_cost_coeff=1e-5,
+                 *args, **kwargs):
+        self._Serializable__initialize(locals())
+        self.vel_deviation_cost_coeff = vel_deviation_cost_coeff
+        self.alive_bonus = alive_bonus
+        self.ctrl_cost_coeff = ctrl_cost_coeff
+        self.impact_cost_coeff = impact_cost_coeff
+        MujocoEnv.__init__(
+            self, model_path=self.MODEL_PATH, frame_skip=5, *args, **kwargs)
+
+    def _get_obs(self):
+        data = self.sim.data
+        return np.concatenate([
+            data.qpos.flat,
+            data.qvel.flat,
+            np.clip(data.cfrc_ext, -1, 1).flat,
+            self.get_body_com("torso").flat,
+        ])
+
+    def _get_com(self):
+        # Mass-weighted average of the body frame positions, i.e. the
+        # center of mass of the whole model.
+        data = self.sim.data
+        mass = self.model.body_mass[:, None]
+        xpos = data.xipos
+        return np.sum(mass * xpos, 0) / np.sum(mass)
+
+    def step(self, action):
+        pos_before = self._get_com()
+        self.do_simulation(action, self.frame_skip)
+        pos_after = self._get_com()
+        next_obs = self._get_obs()
+
+        alive_bonus = self.alive_bonus
+        data = self.sim.data
+
+        # The center-of-mass velocity was originally computed by mujoco
+        # rather than by finite differences.
+        comvel = (pos_after - pos_before) / self.dt
+        lin_vel_reward = comvel[0]
+        lb, ub = self.action_space.low, self.action_space.high
+        scaling = (ub - lb) * 0.5
+        ctrl_cost = 0.5 * self.ctrl_cost_coeff * np.sum(
+            np.square(action / scaling))
+        impact_cost = 0.5 * self.impact_cost_coeff * np.sum(
+            np.square(np.clip(data.cfrc_ext, -1, 1)))
+        vel_deviation_cost = 0.5 * self.vel_deviation_cost_coeff * np.sum(
+            np.square(comvel[1:]))
+        reward = (lin_vel_reward + alive_bonus - ctrl_cost
+                  - impact_cost - vel_deviation_cost)
+        # Episode terminates when the torso height leaves [0.8, 2.0].
+        done = data.qpos[2] < 0.8 or data.qpos[2] > 2.0
+        env_infos = dict(reward_linvel=lin_vel_reward,
+                         reward_ctrl=-ctrl_cost,
+                         reward_alive=alive_bonus)
+
+        return next_obs, reward, done, env_infos
+
+    def reset_model(self):
+        self.set_state(
+            self.init_qpos + np.random.normal(size=self.init_qpos.shape) * 0.01,
+            self.init_qvel + np.random.normal(size=self.init_qvel.shape) * 0.1)
+        return self._get_obs()
diff --git a/softlearning/environments/gym/mujoco/rllab_swimmer.py b/softlearning/environments/gym/mujoco/rllab_swimmer.py
new file mode 100644
index 000000000..3d54ecae4
--- /dev/null
+++ b/softlearning/environments/gym/mujoco/rllab_swimmer.py
@@ -0,0 +1,60 @@
+import os.path as osp
+
+import numpy as np
+from gym.envs.mujoco.mujoco_env import MujocoEnv
+from serializable import Serializable
+
+from softlearning.misc.utils import PROJECT_PATH
+
+
+class RLLabSwimmerEnv(MujocoEnv, Serializable):
+    """Environment based on the SwimmerEnv from rllab.
+
+    https://github.com/rll/rllab/blob/master/rllab/envs/mujoco/swimmer_env.py
+    """
+
+    MODEL_PATH = osp.abspath(
+        osp.join(PROJECT_PATH, 'models', 'rllab_swimmer.xml'))
+    ORI_IND = 2  # index of the orientation coordinate in qpos
+
+    def __init__(self, ctrl_cost_coeff=1e-2, *args, **kwargs):
+        self._Serializable__initialize(locals())
+        self.ctrl_cost_coeff = ctrl_cost_coeff
+        MujocoEnv.__init__(
+            self, model_path=self.MODEL_PATH, frame_skip=5, *args, **kwargs)
+
+    def _get_obs(self):
+        return np.concatenate([
+            self.sim.data.qpos.flat,
+            self.sim.data.qvel.flat,
+            # self.get_body_com("torso").flat,
+        ]).reshape(-1)
+
+    def get_ori(self):
+        return self.sim.data.qpos[self.__class__.ORI_IND]
+
+    def reset_model(self):
+        self.set_state(
+            self.init_qpos + np.random.normal(size=self.init_qpos.shape) * 0.01,
+            self.init_qvel + np.random.normal(size=self.init_qvel.shape) * 0.1)
+        return self._get_obs()
+
+    def step(self, action):
+        # pos_before = self.get_body_com("torso")[0]
+        pos_before = self.sim.data.qpos[0]
+        self.do_simulation(action, self.frame_skip)
+        pos_after = self.sim.data.qpos[0]
+        next_obs = self._get_obs()
+
+        lb, ub = self.action_space.low, self.action_space.high
+        scaling = (ub - lb) * 0.5
+        ctrl_cost = 0.5 * self.ctrl_cost_coeff * np.sum(
+            np.square(action / scaling))
+        forward_reward = (pos_after - pos_before) / self.dt
+        reward = forward_reward - ctrl_cost
+        done = False
+        env_infos = dict(reward_forward=forward_reward,
+                         reward_ctrl=-ctrl_cost)
+
+        return next_obs, reward, done, env_infos
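
A minimal usage sketch for the two new environment ids, assuming that importing softlearning.environments.gym (the module edited above) triggers the gym registration of these specs; if registration is wired up elsewhere in softlearning, the import would need to be adjusted:

    import gym

    # Assumed to run the registration side effects for the new ids.
    import softlearning.environments.gym  # noqa: F401

    env = gym.make('Swimmer-RLLab-v0')
    observation = env.reset()
    for _ in range(100):
        action = env.action_space.sample()
        observation, reward, done, info = env.step(action)
        if done:
            observation = env.reset()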