The document outlines a Python implementation of a Snake game using Q-learning for reinforcement learning. It defines the game environment, including the snake's movement, food placement, and collision detection, as well as a Q-learning agent that learns to play the game through exploration and exploitation. The agent uses a neural network model to predict Q-values for actions based on the game state.
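
In Q-learning terms, the agent's replay step nudges the network's estimate for the chosen action toward the standard one-step target

    target = reward + gamma * max_a' Q(next_state, a')

where gamma is the discount factor (0.9 in the code below) and the maximum runs over the four possible moves; when a transition ends the game, the target is just the reward.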


import numpy as np
import random
import tensorflow as tf
from tensorflow.keras import layers
import pygame
from enum import Enum
from collections import namedtuple

# Game setup: directions, grid points, and display constants
class Direction(Enum):
    RIGHT = 1
    LEFT = 2
    UP = 3
    DOWN = 4

Point = namedtuple('Point', 'x, y')

BLOCK_SIZE = 20
SPEED = 10
WHITE = (255, 255, 255)
RED = (200, 0, 0)
BLUE1 = (0, 0, 255)
BLUE2 = (0, 100, 255)
BLACK = (0, 0, 0)

class SnakeGame:
    def __init__(self, w=640, h=480):
        self.w = w
        self.h = h
        # init display (pygame must be initialised before set_mode)
        pygame.init()
        self.display = pygame.display.set_mode((self.w, self.h))
        pygame.display.set_caption('Snake')
        self.clock = pygame.time.Clock()

        # init game state
        self.direction = Direction.RIGHT
        self.head = Point(self.w / 2, self.h / 2)
        self.snake = [self.head,
                      Point(self.head.x - BLOCK_SIZE, self.head.y),
                      Point(self.head.x - (2 * BLOCK_SIZE), self.head.y)]
        self.score = 0
        self.food = None
        self._place_food()

    def _place_food(self):
        x = random.randint(0, (self.w - BLOCK_SIZE) // BLOCK_SIZE) * BLOCK_SIZE
        y = random.randint(0, (self.h - BLOCK_SIZE) // BLOCK_SIZE) * BLOCK_SIZE
        self.food = Point(x, y)
        if self.food in self.snake:
            self._place_food()

    def reset(self):
        self.direction = Direction.RIGHT
        self.head = Point(self.w / 2, self.h / 2)
        self.snake = [self.head,
                      Point(self.head.x - BLOCK_SIZE, self.head.y),
                      Point(self.head.x - (2 * BLOCK_SIZE), self.head.y)]
        self.score = 0
        self._place_food()
        return self.get_state()

    def get_state(self):
        # A simple state representation: head position, food position, direction
        return (self.head.x, self.head.y, self.food.x, self.food.y, self.direction.value)

    def take_action(self, action):
        if action == Direction.RIGHT:
            self.direction = Direction.RIGHT
        elif action == Direction.LEFT:
            self.direction = Direction.LEFT
        elif action == Direction.UP:
            self.direction = Direction.UP
        elif action == Direction.DOWN:
            self.direction = Direction.DOWN
        self._move(self.direction)

    def _move(self, direction):
        x = self.head.x
        y = self.head.y
        if direction == Direction.RIGHT:
            x += BLOCK_SIZE
        elif direction == Direction.LEFT:
            x -= BLOCK_SIZE
        elif direction == Direction.DOWN:
            y += BLOCK_SIZE
        elif direction == Direction.UP:
            y -= BLOCK_SIZE
        self.head = Point(x, y)
        # Grow the body at the new head position; step() pops the tail
        # unless food was eaten, so the length stays consistent.
        self.snake.insert(0, self.head)

    def step(self):
        # Calculate reward and check for game over
        if self._is_collision():
            return self.get_state(), -10, True   # Game over
        elif self.head == self.food:
            self.score += 1
            self._place_food()
            return self.get_state(), 10, False   # Reward for eating food
        else:
            self.snake.pop()
            return self.get_state(), -1, False   # Small negative reward to encourage movement

    def _is_collision(self):
        # Check if the snake hits the wall or itself
        if (self.head.x > self.w - BLOCK_SIZE or self.head.x < 0 or
                self.head.y > self.h - BLOCK_SIZE or self.head.y < 0):
            return True
        if self.head in self.snake[1:]:
            return True
        return False

class QLearningAgent:
    def __init__(self, action_space):
        self.action_space = action_space
        self.epsilon = 1.0            # Exploration rate
        self.epsilon_min = 0.1
        self.epsilon_decay = 0.995
        self.gamma = 0.9              # Discount factor
        self.learning_rate = 0.001    # Must be set before build_model() uses it
        self.model = self.build_model()

    def build_model(self):
        model = tf.keras.Sequential([
            layers.Dense(24, input_dim=5, activation='relu'),
            layers.Dense(24, activation='relu'),
            layers.Dense(4, activation='linear')  # 4 possible actions
        ])
        model.compile(loss='mse',
                      optimizer=tf.keras.optimizers.Adam(learning_rate=self.learning_rate))
        return model

    def act(self, state):
        # Epsilon-greedy selection; returns an action index (0..3) in both branches
        if np.random.rand() <= self.epsilon:
            return random.randrange(len(self.action_space))  # Exploration
        state = np.array(state).reshape(1, -1)
        q_values = self.model.predict(state, verbose=0)
        return int(np.argmax(q_values[0]))  # Exploitation

    def replay(self, state, action, reward, next_state, done):
        # One-step Q-learning target: r + gamma * max_a' Q(next_state, a')
        target = reward
        if not done:
            next_state = np.array(next_state).reshape(1, -1)
            target = reward + self.gamma * np.max(self.model.predict(next_state, verbose=0)[0])

        state = np.array(state).reshape(1, -1)
        target_f = self.model.predict(state, verbose=0)
        target_f[0][action] = target
        self.model.fit(state, target_f, epochs=1, verbose=0)

        # Decay exploration over time
        if self.epsilon > self.epsilon_min:
            self.epsilon *= self.epsilon_decay
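
The listing stops after the agent definition, so a driver loop is not shown. A minimal sketch of how the two classes could be wired together follows; the episode count, per-episode step cap, and the mapping from an action index back to a Direction are illustrative assumptions, not part of the original code.

# Hypothetical training driver (not in the original listing).
# Episode count, step cap, and the index -> Direction mapping are assumptions.
if __name__ == '__main__':
    env = SnakeGame()
    agent = QLearningAgent(action_space=list(Direction))

    for episode in range(200):               # assumed number of episodes
        state = env.reset()
        done = False
        steps = 0
        while not done and steps < 500:      # assumed per-episode step cap
            action_idx = agent.act(state)                     # index 0..3
            env.take_action(list(Direction)[action_idx])      # map index to Direction
            next_state, reward, done = env.step()
            agent.replay(state, action_idx, reward, next_state, done)
            state = next_state
            steps += 1
        print(f'Episode {episode}: score={env.score}, epsilon={agent.epsilon:.3f}')

    pygame.quit()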
