Skip to content

Instantly share code, notes, and snippets.

@NeelMishra
NeelMishra / gist:9e47aebcdef11c4fed0920de3b89e170
Created January 15, 2025 15:09
Monte Carlo Cart Pole Balancing with Epsilon Greedy Policy Improvement
import gymnasium as gym
import numpy as np
class MonteCarloCartPole:
def __init__(self, n_bins=10, learning_rate=0.1, gamma=0.99, epsilon=0.1):
self.env = gym.make('CartPole-v1')
self.n_bins = n_bins
self.learning_rate = learning_rate
self.gamma = gamma
self.epsilon = epsilon