cse151b-final-project/dqn_wordle.py

import gym
import sys
from stable_baselines3 import DQN
from stable_baselines3.common.env_util import make_vec_env
import wordle_gym
import numpy as np
from tqdm import tqdm

def train(model, env, total_timesteps=100000):
    """Run the learning loop on *model* and write the result to disk.

    Args:
        model: Object exposing ``learn(total_timesteps=..., progress_bar=...)``
            and ``save(path)``.
        env: Accepted for signature symmetry with ``test``; this function
            does not read it.
        total_timesteps: Forwarded unchanged to ``model.learn``.
    """
    checkpoint_name = "dqn_wordle"

    model.learn(progress_bar=True, total_timesteps=total_timesteps)
    model.save(checkpoint_name)

def test(model, env, test_num=1000):
    """Play ``test_num`` evaluation episodes and return the fraction won.

    Args:
        model: Agent whose ``predict(obs)`` returns ``(action, state)``.
            When ``None``, the checkpoint saved as ``dqn_wordle`` is loaded.
        env: Environment driven through ``reset()`` (returning the
            observation) and ``step(action)`` (returning a 4-tuple).
            When ``None``, a fresh ``wordle-v0`` environment is created.
        test_num: Number of episodes to play.

    Returns:
        Number of episodes counted as won divided by ``test_num``, or
        ``0.0`` when ``test_num`` is not positive.
    """
    if test_num <= 0:
        # Nothing to evaluate; avoid dividing by zero below.
        return 0.0

    # Resolve the agent and environment once, outside the episode loop,
    # instead of re-reading the checkpoint and rebuilding the environment
    # for every episode.
    if model is None:
        model = DQN.load("dqn_wordle")
    if env is None:
        env = gym.make("wordle-v0")

    total_correct = 0

    for _ in tqdm(range(test_num)):
        obs = env.reset()
        done = False
        rewards = 0
        while not done:
            action, _states = model.predict(obs)
            obs, rewards, done, info = env.step(action)

            print(action, obs, rewards)

        # NOTE(review): assumes the environment signals a solved puzzle with
        # a positive reward on the terminating step -- confirm against the
        # wordle_gym reward scheme and adjust this check if it differs.
        if rewards > 0:
            total_correct += 1

    return total_correct / test_num

if __name__ == "__main__":
    # Build the environment and a DQN agent with an MLP policy on top of it.
    env = gym.make("wordle-v0")
    model = DQN(policy="MlpPolicy", env=env, verbose=0)

    # Show what was constructed before starting the run.
    for component in (env, model):
        print(component)

    # Short training run, then a single evaluation episode.
    train(model, env, total_timesteps=10000)
    accuracy = test(model, env, test_num=1)
    print(accuracy)
still doesnt train 2024-03-14 04:36:26 +00:00			`import gym`
			`import sys`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00			`from stable_baselines3 import DQN`
still doesnt train 2024-03-14 04:36:26 +00:00			`from stable_baselines3.common.env_util import make_vec_env`
			`import wordle_gym`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00			`import numpy as np`
still doesnt train 2024-03-14 04:36:26 +00:00			`from tqdm import tqdm`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`def train (model, env, total_timesteps = 100000):`
			`model.learn(total_timesteps=total_timesteps, progress_bar=True)`
			`model.save("dqn_wordle")`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`def test(model, env, test_num=1000):`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`total_correct = 0`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`for i in tqdm(range(test_num)):`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`model = DQN.load("dqn_wordle")`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`env = gym.make("wordle-v0")`
			`obs = env.reset()`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00			`done = False`
			`while not done:`
still doesnt train 2024-03-14 04:36:26 +00:00			`action, _states = model.predict(obs)`
			`obs, rewards, done, info = env.step(action)`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`print(action, obs, rewards)`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`return total_correct / test_num`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`if __name__ == "__main__":`

			`env = gym.make("wordle-v0")`
			`model = DQN("MlpPolicy", env, verbose=0)`
			`print(env)`
			`print(model)`
attempt to use the other wordle gym, causing cuda errors 2024-03-13 21:27:34 +00:00
still doesnt train 2024-03-14 04:36:26 +00:00			`train(model, env, total_timesteps=10000)`
			`print(test(model, env, test_num=1))`