# Professional Documents
# Culture Documents
# Son
class SONAgent:
    """Agent holding a tabular Q-value estimate per (cell, action) pair.

    Attributes:
        num_cells: Number of cells; the row count of ``q_table``.
        num_actions: Number of actions; the column count of ``q_table``.
        q_table: Float array of shape ``(num_cells, num_actions)``,
            initialised to all zeros.
    """

    def __init__(self, num_cells: int, num_actions: int) -> None:
        """Store the problem dimensions and allocate a zeroed Q-table.

        Args:
            num_cells: Number of rows to allocate in the Q-table.
            num_actions: Number of columns to allocate in the Q-table.
        """
        self.num_cells = num_cells
        self.num_actions = num_actions
        # Every (cell, action) estimate starts at zero.
        self.q_table = np.zeros((num_cells, num_actions))
class Testbed:
    """Environment state: which cell, out of ``num_cells``, is current.

    Attributes:
        num_cells: Number of cells in the testbed.
        current_cell: Index of the current cell, in ``[0, num_cells)``.
    """

    def __init__(self, num_cells: int) -> None:
        """Record the cell count and pick a uniformly random starting cell.

        Args:
            num_cells: Number of cells; must be positive, since
                ``np.random.randint`` rejects an empty range.
        """
        self.num_cells = num_cells
        # randint's upper bound is exclusive, so this is a valid cell index.
        self.current_cell = np.random.randint(num_cells)
# Parameters
# Upper bound (exclusive) for the random start cell drawn each episode.
num_cells = 10
# NOTE(review): not referenced in the visible code — presumably the action
# count passed to SONAgent; confirm against the caller.
num_actions = 3
# NOTE(review): not referenced in the visible code — presumably the step size
# of the Q-value update; confirm.
learning_rate = 0.1
# NOTE(review): not referenced in the visible code — presumably the discount
# applied to future reward in the Q-value update; confirm.
discount_factor = 0.9
# Number of iterations of the training loop.
num_episodes = 1000
# Training loop
# Create the environment once; each episode only resets its current cell.
testbed = Testbed(num_cells)
for episode in range(num_episodes):
    total_reward = 0
    # Random initial cell for each episode
    testbed.current_cell = np.random.randint(num_cells)
    # NOTE(review): nothing in this loop updates total_reward, so the value
    # reported below is always 0 — confirm whether a per-step interaction
    # loop is missing here.
    # Report progress every 100th episode.
    if episode % 100 == 0:
        print(f"Episode {episode}, Total Reward: {total_reward}")