Q4.ipynb - Colab

Uploaded by

Rahul me20b145

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

19 views4 pages

Q4.ipynb - Colab

Uploaded by

Rahul me20b145

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

5/12/24, 8:37 AM Q4.ipynb - Colab

import time

import numpy as np

class Agent:
    """Tabular TD-control batting agent (SARSA or Q-learning).

    The Q-table is indexed as ``q_values[balls][wickets][action]`` where
    ``balls`` is the number of balls already faced in the current innings,
    ``wickets`` is the number of wickets already lost, and ``action`` is one
    of six shot choices (0..5).

    Tunable attributes (set after construction):
        epsilon      exploration rate for the "e-greedy" policy.
        alpha        learning rate.
        gamma        discount factor.
        policy_type  "e-greedy" or "softmax".
        algo         "sarsa" or "q-learning".
    """

    NUM_ACTIONS = 6  # size of the last axis of the Q-table

    def __init__(self, num_balls, num_matches):
        """Create an agent for innings of ``num_balls`` balls.

        ``num_matches`` is only stored; nothing in this class reads it.
        """
        self.total_wickets = 4
        self.num_balls = num_balls
        self.num_matches = num_matches
        self.q_values = np.zeros(
            (self.num_balls, self.total_wickets, self.NUM_ACTIONS),
            dtype=np.float32,
        )

        self.epsilon = 0.1
        # (balls, wickets) is the state in which the pending action was chosen.
        self.balls = 0
        self.wickets = 0

        self.alpha = 0.1
        self.gamma = 0.9

        # Action whose outcome has not been reported yet; None means the next
        # call starts a fresh innings and carries no feedback to learn from.
        self.last_action = None

        self.policy_type = "e-greedy"  # e-greedy, softmax
        self.algo = "sarsa"  # q-learning, sarsa

        self.next_action = None

    def policy(self):
        """Sample an action for the current ``(balls, wickets)`` state.

        Returns:
            int: action index in ``range(6)``.

        Raises:
            ValueError: if ``policy_type`` is not "e-greedy" or "softmax".
        """
        action_values = self.q_values[self.balls][self.wickets]

        if self.policy_type == "e-greedy":
            if np.random.rand() < self.epsilon:
                return int(np.random.randint(0, self.NUM_ACTIONS))
            return int(np.argmax(action_values))

        if self.policy_type == "softmax":
            # Subtracting the maximum keeps exp() from overflowing to inf,
            # which would otherwise produce NaN probabilities.
            shifted = action_values.astype(np.float64) - np.max(action_values)
            weights = np.exp(shifted)
            probabilities = weights / np.sum(weights)
            return int(np.random.choice(self.NUM_ACTIONS, p=probabilities))

        raise ValueError(f"unknown policy_type: {self.policy_type!r}")

    def _td_update(self, ball, wickets, action, reward, bootstrap):
        """Move Q(ball, wickets, action) towards ``reward + gamma * bootstrap``."""
        row = self.q_values[ball][wickets]
        row[action] += self.alpha * (reward + self.gamma * bootstrap - row[action])

    def get_action(self, wicket, runs_scored):
        """Learn from the previous ball's outcome and choose the next action.

        Calling protocol, as implemented by ``Environment.innings``:
          * one call before every ball, passing the outcome of the ball
            bowled before it;
          * one extra call right after the last wicket falls (its return
            value is discarded);
          * no extra call when the innings ends on the ball limit; that
            final ball is only reported by the first call of the next innings.

        Args:
            wicket: 1 if the previous ball took a wicket, else 0.
            runs_scored: runs scored off the previous ball.

        Returns:
            int: action index in ``range(6)``.

        Raises:
            ValueError: if ``algo`` is not "sarsa" or "q-learning".
        """
        if self.algo not in ("sarsa", "q-learning"):
            raise ValueError(f"unknown algo: {self.algo!r}")

        if self.last_action is None:
            # Fresh innings: the arguments describe nothing this agent did
            # (they may be stale), so just pick the opening action.
            self.last_action = self.policy()
            return self.last_action

        prev_ball = self.balls
        prev_wickets = self.wickets
        prev_action = self.last_action
        reward = runs_scored - 0.5  # every ball carries a fixed cost of 0.5

        self.balls += 1
        self.wickets += int(wicket)

        all_out = self.wickets >= self.total_wickets
        if all_out or self.balls >= self.num_balls:
            # Terminal transition: there is no successor state to bootstrap from.
            self._td_update(prev_ball, prev_wickets, prev_action, reward, 0.0)
            self.balls = 0
            self.wickets = 0
            self.next_action = None
            action = self.policy()
            # After an all-out the caller discards this action, so it must not
            # be kept as pending. After the ball limit this call *is* the first
            # ball of the next innings, so the action stays pending.
            self.last_action = None if all_out else action
            return action

        successor_values = self.q_values[self.balls][self.wickets]
        if self.algo == "sarsa":
            # On-policy: bootstrap from the action that will actually be played.
            self.next_action = self.policy()
            self._td_update(
                prev_ball,
                prev_wickets,
                prev_action,
                reward,
                successor_values[self.next_action],
            )
        else:
            # Off-policy: bootstrap from the greedy value, then act.
            self._td_update(
                prev_ball,
                prev_wickets,
                prev_action,
                reward,
                np.max(successor_values),
            )
            self.next_action = self.policy()

        self.last_action = self.next_action
        return self.last_action

https://colab.research.google.com/drive/1_qSwQRhp60THO4Tt1TbNkUKWXDEbqrI0#printMode=true 2/4
5/12/24, 8:37 AM Q4.ipynb - Colab
wickets = 4  # wickets in hand at the start of every innings


class Environment:
    """Ball-by-ball innings simulator that queries an agent for each shot.

    ``agent`` must expose ``get_action(wicket, runs_scored)`` returning an
    integer in ``range(6)``; that integer indexes the probability and run
    tables below.
    """

    def __init__(self, num_balls, agent):
        """Store the innings length and the agent, and set up the shot tables."""
        self.num_balls = num_balls
        self.agent = agent
        self.__run_time = 0
        self.__total_runs = 0
        self.__total_wickets = 0
        self.__runs_scored = 0
        self.__start_time = 0
        self.__end_time = 0
        # Per-action probability of losing a wicket.
        self.__p_out = np.array([0.001, 0.01, 0.02, 0.03, 0.1, 0.3])
        # Per-action probability that the attempted runs are scored,
        # given that no wicket fell.
        self.__p_run = np.array([1, 0.9, 0.85, 0.8, 0.75, 0.7])
        # Runs attempted by each action.
        self.__action_runs_map = np.array([0, 1, 2, 3, 4, 6])
        self.__wickets_left = wickets
        self.__wicket = 0
        self.__batting_order = np.array([0, 1, 2, 3])

    def __get_action(self):
        """Ask the agent for an action and add the call's duration to the run time."""
        # perf_counter is monotonic and high-resolution, unlike the wall clock.
        self.__start_time = time.perf_counter()
        action = self.agent.get_action(self.__wicket, self.__runs_scored)
        self.__end_time = time.perf_counter()
        self.__run_time = self.__run_time + self.__end_time - self.__start_time
        return action

    def __get_outcome(self, action):
        """Sample ``(wicket, runs)`` for one ball played with ``action``.

        Runs are only sampled when no wicket falls; a dismissal scores 0.
        """
        pout = self.__p_out[action]
        prun = self.__p_run[action]
        wicket = np.random.choice(2, 1, p=[1 - pout, pout])[0]
        runs = 0
        if wicket == 0:
            scored = np.random.choice(2, 1, p=[1 - prun, prun])[0]
            runs = self.__action_runs_map[action] * scored
        return wicket, runs

    def innings(self):
        """Play one innings and return ``(total_runs, total_wickets, run_time)``.

        ``run_time`` is the cumulative time in seconds spent inside the
        agent's ``get_action`` calls during this innings.
        """
        self.__wickets_left = wickets
        # Clear both halves of the previous outcome so that the first
        # get_action call of this innings does not see a stale wicket flag.
        self.__wicket = 0
        self.__runs_scored = 0
        self.__total_runs = 0
        self.__total_wickets = 0
        self.__run_time = 0
        self.__start_time = 0
        self.__end_time = 0

        for _ in range(self.num_balls):
            if self.__wickets_left <= 0:
                break
            action = self.__get_action()
            self.__wicket, self.__runs_scored = self.__get_outcome(action)
            self.__total_runs = self.__total_runs + self.__runs_scored
            if self.__wicket > 0:
                self.__wickets_left = self.__wickets_left - 1
                self.__total_wickets = self.__total_wickets + self.__wicket
                if self.__wickets_left == 0:
                    # Extra call so the agent observes the final dismissal;
                    # the returned action is intentionally ignored.
                    self.__get_action()
        # NOTE: when the innings ends on the ball limit instead, the last
        # ball's outcome is never reported to the agent.
        return self.__total_runs, self.__total_wickets, self.__run_time

https://colab.research.google.com/drive/1_qSwQRhp60THO4Tt1TbNkUKWXDEbqrI0#printMode=true 3/4
5/12/24, 8:37 AM Q4.ipynb - Colab
# Train the agent over many innings and report the mean score of each
# consecutive batch of 100 matches.
num_matches = 10000
num_balls = 60
agent = Agent(num_balls, num_matches)
environment = Environment(num_balls, agent)

# One row per match; kept as (num_matches, 1) column vectors.
score = np.zeros((num_matches, 1))
run_time = np.zeros((num_matches, 1))
wicket = np.zeros((num_matches, 1))

last_100_avgs = []  # scores of the current batch, emptied after each report
for i in range(num_matches):
    innings_result = environment.innings()
    score[i] = innings_result[0]
    wicket[i] = innings_result[1]
    run_time[i] = innings_result[2]
    last_100_avgs.append(score[i])
    matches_played = i + 1
    if matches_played % 100 != 0:
        continue
    print("Match: ", matches_played, "Average: ", np.mean(last_100_avgs))
    last_100_avgs = []

Match: 100 Average: 78.11

Match: 200 Average: 85.15
Match: 300 Average: 84.2
Match: 400 Average: 84.91
Match: 500 Average: 85.31
Match: 600 Average: 87.86
Match: 700 Average: 80.53
Match: 800 Average: 82.99
Match: 900 Average: 85.48
Match: 1000 Average: 83.93
Match: 1100 Average: 81.83
Match: 1200 Average: 84.81
Match: 1300 Average: 89.8
Match: 1400 Average: 90.11
Match: 1500 Average: 86.59
Match: 1600 Average: 91.43
Match: 1700 Average: 84.69
Match: 1800 Average: 85.3
Match: 1900 Average: 94.17
Match: 2000 Average: 87.65
Match: 2100 Average: 87.38

https://colab.research.google.com/drive/1_qSwQRhp60THO4Tt1TbNkUKWXDEbqrI0#printMode=true 4/4

Essentials of Sociology 4th Edition Giddens Carr Ebook and TestBank Bundle Download Instantly
No ratings yet
Essentials of Sociology 4th Edition Giddens Carr Ebook and TestBank Bundle Download Instantly
323 pages
Traffic Engineering Lab Guide IITG
No ratings yet
Traffic Engineering Lab Guide IITG
101 pages
Ancient Psychomusicology Studies
No ratings yet
Ancient Psychomusicology Studies
557 pages
(Ebook) Intelligent Materials by M. Shahinpoor, M. Shahinpoor, H-J. Schneider ISBN 9780854043354, 0854043357 PDF Download
100% (1)
(Ebook) Intelligent Materials by M. Shahinpoor, M. Shahinpoor, H-J. Schneider ISBN 9780854043354, 0854043357 PDF Download
47 pages
MBBS/BDS (Management Quota) Course Session:2022 - 2023 Provisional List of Candidates Allotted On - 26.11.2022
No ratings yet
MBBS/BDS (Management Quota) Course Session:2022 - 2023 Provisional List of Candidates Allotted On - 26.11.2022
161 pages
Well Logging Data Acquisition and Applications Serra Oberto Serra Download
No ratings yet
Well Logging Data Acquisition and Applications Serra Oberto Serra Download
39 pages
Directing and Producing A Stage Play
No ratings yet
Directing and Producing A Stage Play
5 pages
An Assignment On Social Change & Development
No ratings yet
An Assignment On Social Change & Development
16 pages
Q3 (1) .Ipynb - Colab
No ratings yet
Q3 (1) .Ipynb - Colab
3 pages
Q3.ipynb - Colab
No ratings yet
Q3.ipynb - Colab
3 pages
Domatia
No ratings yet
Domatia
6 pages
Q2.ipynb - Colab
No ratings yet
Q2.ipynb - Colab
3 pages
Q1.ipynb - Colab
No ratings yet
Q1.ipynb - Colab
3 pages
European Steel and Alloy Grades: 10crmo9-10 (1.7380)
No ratings yet
European Steel and Alloy Grades: 10crmo9-10 (1.7380)
3 pages
Classification of Living Things
No ratings yet
Classification of Living Things
6 pages
PYP Student Planner Guide
No ratings yet
PYP Student Planner Guide
31 pages
Proposal Nia
No ratings yet
Proposal Nia
23 pages
Ce Laws-Reviewer-Prelim
No ratings yet
Ce Laws-Reviewer-Prelim
9 pages
Frozen Lake
No ratings yet
Frozen Lake
2 pages
8 Vertical Stresses Below Applied Loads
No ratings yet
8 Vertical Stresses Below Applied Loads
13 pages
CS6700 Reinforcement Learning Assignment
No ratings yet
CS6700 Reinforcement Learning Assignment
17 pages
q3 Performance Task 1
No ratings yet
q3 Performance Task 1
4 pages
9922 30210 2 PB
No ratings yet
9922 30210 2 PB
9 pages
Porosity and Lithology Determination From Formation Density Log and SNP Sidewall Neutron Porosity Log
No ratings yet
Porosity and Lithology Determination From Formation Density Log and SNP Sidewall Neutron Porosity Log
1 page
L2 Projection Piecewise
No ratings yet
L2 Projection Piecewise
9 pages
Hammer NumericalIntegrationSimplexes 1956
No ratings yet
Hammer NumericalIntegrationSimplexes 1956
9 pages
General Guidelines and Procedures Protocolo de Interpretacion
No ratings yet
General Guidelines and Procedures Protocolo de Interpretacion
12 pages
Quick Guide FDX Console
No ratings yet
Quick Guide FDX Console
5 pages
AA19320
No ratings yet
AA19320
6 pages
Gauss Legendre Quadrature Method
No ratings yet
Gauss Legendre Quadrature Method
7 pages
Assignment EE5179 ME20B145 Report
No ratings yet
Assignment EE5179 ME20B145 Report
6 pages
WBGCore Competencies Final
No ratings yet
WBGCore Competencies Final
12 pages
CS6700 RL 2024 Wa1
No ratings yet
CS6700 RL 2024 Wa1
7 pages
API Mud Balance Instruction Guide
No ratings yet
API Mud Balance Instruction Guide
6 pages
Form Four Geo-1
No ratings yet
Form Four Geo-1
6 pages
Quadrature Rules For Numerical Integration Over Triangles and Tetrahedra
No ratings yet
Quadrature Rules For Numerical Integration Over Triangles and Tetrahedra
3 pages
Homework 1: ELEN E6885: Introduction To Reinforcement Learning September 21, 2021
No ratings yet
Homework 1: ELEN E6885: Introduction To Reinforcement Learning September 21, 2021
8 pages
Gujarat Technological University
No ratings yet
Gujarat Technological University
1 page
Mastering Metrics Published
No ratings yet
Mastering Metrics Published
4 pages
Metal Granulation Solutions
No ratings yet
Metal Granulation Solutions
1 page
DEL MAA: Rahul / Rahul MR AI0538
No ratings yet
DEL MAA: Rahul / Rahul MR AI0538
1 page
Factors in Predicting Health Behaviors Lecture
No ratings yet
Factors in Predicting Health Behaviors Lecture
20 pages
Final Trulytruly Code
No ratings yet
Final Trulytruly Code
13 pages
Output Code
No ratings yet
Output Code
2 pages
RLDL File
No ratings yet
RLDL File
31 pages
Assignment 12: Introduction To Machine Learning Prof. B. Ravindran
100% (1)
Assignment 12: Introduction To Machine Learning Prof. B. Ravindran
4 pages
Import Pandas As PD Import Numpy As NP From Sklearn Import Datasets Def Expectation - Max (Data, Max - Iter 1000)
No ratings yet
Import Pandas As PD Import Numpy As NP From Sklearn Import Datasets Def Expectation - Max (Data, Max - Iter 1000)
1 page
ML - 6 - Jupyter Notebook
No ratings yet
ML - 6 - Jupyter Notebook
5 pages
Scaffold Erection NC2 Cert
No ratings yet
Scaffold Erection NC2 Cert
1 page
Py Code Example 11 0 Baird Semi Gradient DP Like
No ratings yet
Py Code Example 11 0 Baird Semi Gradient DP Like
3 pages
RLAI Lab 1 Rahel Benjamin
No ratings yet
RLAI Lab 1 Rahel Benjamin
16 pages
Class ActorCritic
No ratings yet
Class ActorCritic
1 page
Frozen Lake
No ratings yet
Frozen Lake
6 pages
Generalization Limits Dynamics Randomization Report
No ratings yet
Generalization Limits Dynamics Randomization Report
4 pages
Dream Team
No ratings yet
Dream Team
4 pages
21L7734 Shais Quiz3 Aml 8A
No ratings yet
21L7734 Shais Quiz3 Aml 8A
25 pages
Practical No4,5
No ratings yet
Practical No4,5
7 pages
AI 3000 / CS 5500: Reinforcement Learning Assignment 1: Problem 1: Markov Reward Process
No ratings yet
AI 3000 / CS 5500: Reinforcement Learning Assignment 1: Problem 1: Markov Reward Process
5 pages
Cricket Score Python Automation Description
No ratings yet
Cricket Score Python Automation Description
3 pages
Class-Work-1 (26-08-2024)
No ratings yet
Class-Work-1 (26-08-2024)
5 pages
Uploads 3
No ratings yet
Uploads 3
2 pages
Treasure Island MDP Using Value Iteration: Python Code
No ratings yet
Treasure Island MDP Using Value Iteration: Python Code
5 pages
Ass1 Merged Merged
No ratings yet
Ass1 Merged Merged
19 pages
10.Q Learning Algorithm
No ratings yet
10.Q Learning Algorithm
2 pages
Bayesian Decision Theory Quiz
No ratings yet
Bayesian Decision Theory Quiz
6 pages
Group 20 Lab 6
No ratings yet
Group 20 Lab 6
15 pages
HW2 - 110306073.ipynb - Colaboratory
No ratings yet
HW2 - 110306073.ipynb - Colaboratory
3 pages
Solutions - REINFORCE and Linear Function Approximation
No ratings yet
Solutions - REINFORCE and Linear Function Approximation
5 pages
PandasAI + Cricket
No ratings yet
PandasAI + Cricket
10 pages
DRL - AI309 - A - Assignment - 1 - F24 - GIKI
No ratings yet
DRL - AI309 - A - Assignment - 1 - F24 - GIKI
3 pages
FrozenLake Q-Learning Guide
No ratings yet
FrozenLake Q-Learning Guide
4 pages
Reinforcement Learning - Project 3
No ratings yet
Reinforcement Learning - Project 3
9 pages
Exam Prep Exercises034534123124
No ratings yet
Exam Prep Exercises034534123124
20 pages
Cricket Match Simulation Data
No ratings yet
Cricket Match Simulation Data
752 pages
Genetic Bee Colony
No ratings yet
Genetic Bee Colony
22 pages
Tugas 2 Grid World
No ratings yet
Tugas 2 Grid World
7 pages
Game Theory Strategies Code Examples
No ratings yet
Game Theory Strategies Code Examples
10 pages
1 - All Python Codes + Neo4j Samples
No ratings yet
1 - All Python Codes + Neo4j Samples
16 pages
RLDL
No ratings yet
RLDL
23 pages
Abu Minhaj Farooqi 37560 Ai Lab Final Exam
No ratings yet
Abu Minhaj Farooqi 37560 Ai Lab Final Exam
14 pages
RL Unit V Qa
No ratings yet
RL Unit V Qa
13 pages
Machine Learning Lab (3) Report (21 CP 81)
No ratings yet
Machine Learning Lab (3) Report (21 CP 81)
7 pages
Technology
No ratings yet
Technology
7 pages
SRM Eswari Workshop Day 1 - Feb 2025 - Jupyter Notebook
No ratings yet
SRM Eswari Workshop Day 1 - Feb 2025 - Jupyter Notebook
39 pages
Ai Lab
No ratings yet
Ai Lab
15 pages
REINFORCE Algorithm Python Guide
No ratings yet
REINFORCE Algorithm Python Guide
15 pages
Sindhuja Assignment-2 AI
No ratings yet
Sindhuja Assignment-2 AI
22 pages
Python Neural Network and Perceptron Guide
No ratings yet
Python Neural Network and Perceptron Guide
6 pages
Ass1 Merged Merged
No ratings yet
Ass1 Merged Merged
15 pages
35 Case Syntax
No ratings yet
35 Case Syntax
269 pages
AAL Programs
No ratings yet
AAL Programs
12 pages
Policy Gradient Methods Guide
No ratings yet
Policy Gradient Methods Guide
28 pages
Assignment 1
No ratings yet
Assignment 1
24 pages

Q4.ipynb - Colab

Uploaded by

Q4.ipynb - Colab

Uploaded by

5/12/24, 8:37 AM Q4.

Match: 100 Average: 78.11

You might also like