diff --git a/examples/scripts/reinforcement_learning/simple_cart_pole/README.md b/examples/scripts/reinforcement_learning/simple_cart_pole/README.md
new file mode 100644
index 0000000000..3bb276b1d4
--- /dev/null
+++ b/examples/scripts/reinforcement_learning/simple_cart_pole/README.md
@@ -0,0 +1,37 @@
+# Example for Reinforcement Learning (RL) With Gazebo
+
+This demo world shows how you can use SDFormat, Ray RLlib, and Gazebo to perform RL with Python.
+We start with a very simple cart-pole world, defined in the SDF file `cart_pole.sdf`. It is
+analogous to the classic CartPole control task.
+
+## Create a VENV
+
+First, create a virtual environment using Python:
+```
+python3 -m venv venv
+```
+Activate it:
+```
+. venv/bin/activate
+```
+
+Then install the dependencies. Besides Ray RLlib and PyTorch, the example script also uses
+`gymnasium` and `stable-baselines3`:
+```
+pip install "ray[rllib]" torch gymnasium stable-baselines3
+```
+
+In the same terminal, add your Gazebo Python install directory to the `PYTHONPATH`.
+If you built Gazebo from source in the current working directory, this would be:
+```
+export PYTHONPATH=$PYTHONPATH:install/lib/python
+```
+
+You will also need to set `PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION` to `python` due to
+protobuf version mismatches:
+```
+export PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=python
+```
+
+## Exploring the environment
+
+You can see the environment by running `gz sim cart_pole.sdf`.
diff --git a/examples/scripts/reinforcement_learning/simple_cart_pole/cart_pole.sdf b/examples/scripts/reinforcement_learning/simple_cart_pole/cart_pole.sdf
new file mode 100644
index 0000000000..6c1a1cd0de
--- /dev/null
+++ b/examples/scripts/reinforcement_learning/simple_cart_pole/cart_pole.sdf
@@ -0,0 +1,368 @@
+[cart_pole.sdf (368 lines, full XML omitted): an SDF world with 1 ms physics steps,
+a sun light, and a ground plane, plus a "vehicle_green" model made of chassis, pole,
+pole_mass, left_wheel, right_wheel, and caster links. The links are connected by
+revolute wheel joints, a ball joint for the caster, a revolute chassis-to-pole joint
+about the y axis, and a joint attaching pole_mass to the pole.]
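Before moving on to the training script, it can help to confirm that the `PYTHONPATH` and protobuf settings from the README are picked up. Below is a minimal sanity-check sketch (not part of the example itself), reusing the binding modules and Gazebo version suffixes that `cart_pole_env.py` imports; adjust them to your installed release.

```python
# Confirm the Gazebo Python bindings are importable. The version suffixes
# (common6, sim9, transport14, msgs11) match the ones used by cart_pole_env.py;
# change them to match the Gazebo release you have installed.
from gz.common6 import set_verbosity
from gz.sim9 import TestFixture
from gz.transport14 import Node
from gz.msgs11.world_control_pb2 import WorldControl

set_verbosity(4)  # maximum verbosity so binding problems surface immediately
print("Gazebo Python bindings imported successfully")
```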
diff --git a/examples/scripts/reinforcement_learning/simple_cart_pole/cart_pole_env.py b/examples/scripts/reinforcement_learning/simple_cart_pole/cart_pole_env.py
new file mode 100644
index 0000000000..b45fa9599c
--- /dev/null
+++ b/examples/scripts/reinforcement_learning/simple_cart_pole/cart_pole_env.py
@@ -0,0 +1,120 @@
+import os
+
+import gymnasium as gym
+import numpy as np
+
+from gz.common6 import set_verbosity
+from gz.sim9 import TestFixture, World, world_entity, Model, Link
+from gz.math8 import Vector3d
+from gz.transport14 import Node
+from gz.msgs11.world_control_pb2 import WorldControl
+from gz.msgs11.world_reset_pb2 import WorldReset
+from gz.msgs11.boolean_pb2 import Boolean
+
+from stable_baselines3 import A2C
+
+file_path = os.path.dirname(os.path.realpath(__file__))
+
+
+class GzRewardScorer:
+    """Runs the cart_pole.sdf world through gz-sim's TestFixture and scores it.
+
+    on_pre_update applies a lateral force on the chassis according to the last
+    discrete command, and on_post_update reads the pole angle, pole angular
+    velocity, cart position, and cart velocity to build the observation.
+    """
+
+    def __init__(self):
+        self.fixture = TestFixture(os.path.join(file_path, 'cart_pole.sdf'))
+        self.fixture.on_pre_update(self.on_pre_update)
+        self.fixture.on_post_update(self.on_post_update)
+        #self.fixture.on_configure(self.on_configure)
+        self.command = None
+        self.first_time = True  # Workaround: the configure callback is unreliable, so set up lazily
+        self.fixture.finalize()
+        self.server = self.fixture.server()
+        self.terminated = False
+
+    def on_pre_update(self, info, ecm):
+        if self.first_time:
+            print("Enabling checks")
+            # First call: look up the model and its links, and enable velocity checks.
+            world = World(world_entity(ecm))
+            self.model = Model(world.model_by_name(ecm, "vehicle_green"))
+            self.pole_entity = self.model.link_by_name(ecm, "pole")
+            self.chassis_entity = self.model.link_by_name(ecm, "chassis")
+            self.pole = Link(self.pole_entity)
+            self.pole.enable_velocity_checks(ecm)
+            self.chassis = Link(self.chassis_entity)
+            self.chassis.enable_velocity_checks(ecm)
+            self.first_time = False
+        # Apply the force corresponding to the last discrete action.
+        if self.command == 1:
+            self.chassis.add_world_force(Vector3d(0, 100, 0))
+        elif self.command == 0:
+            self.chassis.add_world_force(Vector3d(0, -100, 0))
+
+    def on_post_update(self, info, ecm):
+        pole_pose = self.pole.world_pose(ecm).rot().euler().y()
+        if self.pole.world_angular_velocity(ecm) is not None:
+            pole_angular_vel = self.pole.world_angular_velocity(ecm).y()
+        else:
+            pole_angular_vel = 0
+            print("Warning: failed to get angular velocity")
+        cart_pose = self.chassis.world_pose(ecm).pos().x()
+        cart_vel = self.chassis.world_linear_velocity(ecm)
+
+        if cart_vel is not None:
+            cart_vel = cart_vel.x()
+        else:
+            cart_vel = 0
+            print("Warning: failed to get cart velocity")
+
+        self.state = np.array([cart_pose, cart_vel, pole_pose, pole_angular_vel], dtype=np.float32)
+        # Terminate once the pole tips too far or the cart drifts out of bounds.
+        if not self.terminated:
+            self.terminated = pole_pose > 0.24 or pole_pose < -0.24 or cart_pose > 4.8 or cart_pose < -4.8
+
+        # Reward 1.0 for every non-terminal step.
+        self.reward = 0.0 if self.terminated else 1.0
+
+    def step(self, action, paused=False):
+        self.command = action
+        self.server.run(True, 1, paused)
+        obs = self.state
+        reward = self.reward
+        return obs, reward, self.terminated, False, {}
+
+    def reset(self):
+        print("Resetting")
+        self.server.reset_all()
+        self.first_time = True
+        self.command = None
+        self.terminated = False
+        obs, _reward, _terminated, _truncated, _info = self.step(None, paused=False)
+        return obs, {}
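+
+
+# CustomCartPole adapts GzRewardScorer to the Gymnasium interface so that an
+# off-the-shelf RL library (stable-baselines3 here) can train against the
+# Gazebo simulation. The observation is [cart position, cart velocity,
+# pole angle, pole angular velocity], with bounds close to those of the
+# classic CartPole task.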
float("inf"), 0.418, 3.4028235e+38]), + (4,), np.float32) + + def reset(self, seed=123): + return self.env.reset() + + def step(self, action): + obs, reward, done, truncated, info = self.env.step(action) + return obs, reward, done, truncated, info + + +env = CustomCartPole({}) +model = A2C("MlpPolicy", env, verbose=1) +model.learn(total_timesteps=10_000) + +vec_env = model.get_env() +obs = vec_env.reset() +for i in range(5000): + action, _state = model.predict(obs, deterministic=True) + obs, reward, done, info = vec_env.step(action) + # Nice to have spawn a gz sim client \ No newline at end of file