0% found this document useful (0 votes)

27 views3 pages

Q1.ipynb - Colab

Uploaded by

Rahul me20b145

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

27 views3 pages

Q1.ipynb - Colab

Uploaded by

Rahul me20b145

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 3

5/12/24, 8:36 AM Q1.ipynb - Colab

1 import numpy as np
2 import time

class Agent:
    """KL-UCB bandit agent choosing one of six actions (arms) per ball.

    The reward credited to an arm is ``1 - wicket`` for the ball on which it
    was played, so each arm is treated as a Bernoulli arm whose mean is the
    empirical "not out" frequency.  Every arm is played once (in index
    order) before the KL-UCB index is used to choose actions.
    """

    # Number of available actions; arms are indexed 0..NUM_ARMS - 1.
    NUM_ARMS = 6

    def __init__(self):
        self.balls_played = 0   # number of actions handed out so far
        self.runs_scored = 0    # cumulative runs reported back to the agent
        self.wickets_down = 0   # cumulative wickets reported back to the agent
        self.last_played = 0    # arm chosen on the previous call
        self.total_reward = 0   # cumulative (1 - wicket) reward

        # Per-arm statistics: number of pulls and summed reward.
        self.pulls = np.zeros(self.NUM_ARMS, dtype=np.int32)
        self.arm_rewards = np.zeros(self.NUM_ARMS, dtype=np.int32)

        # Most recently computed KL-UCB index of every arm.
        self.ucb_arms = np.zeros(self.NUM_ARMS, dtype=np.float32)

    def kl_divergence(self, p, q):
        """Return the Bernoulli KL divergence KL(p || q).

        Uses the convention ``0 * log(0) = 0`` so that the boundary cases
        ``p == 0`` and ``p == 1`` give the correct finite value instead of
        0 or NaN.  When ``q`` lies on the boundary (``q <= 0`` or
        ``q >= 1``) the divergence is 0 if ``p == q`` and infinite otherwise.
        """
        if q <= 0 or q >= 1:
            return 0.0 if p == q else np.inf
        if p == 0:
            return -np.log(1 - q)
        if p == 1:
            return -np.log(q)
        return p * np.log(p / q) + (1 - p) * np.log((1 - p) / (1 - q))

    def solve_q(self, rhs, p_a):
        """Return the KL-UCB index for an arm with empirical mean ``p_a``.

        The index is the largest ``q`` on a 0.01-spaced grid starting at
        ``p_a`` (and below 1) that satisfies ``KL(p_a || q) <= rhs``.  When
        every grid point satisfies the bound the top of the grid is
        returned, i.e. the arm is treated as maximally promising.

        Args:
            rhs: Exploration budget (already divided by the arm's pulls).
            p_a: Empirical mean reward of the arm, in ``[0, 1]``.

        Returns:
            The upper confidence bound ``q`` (``1`` when ``p_a == 1``).
        """
        if p_a == 1:
            return 1

        q_s = np.arange(p_a, 1, 0.01)
        lhs = np.array([self.kl_divergence(p_a, q) for q in q_s])

        feasible = q_s[lhs <= rhs]
        if feasible.size == 0:
            # Only reachable for a negative budget: KL(p_a || p_a) is 0.
            return p_a
        return feasible.max()

    def calculate_ucb(self):
        """Recompute ``self.ucb_arms`` for every arm.

        Uses the exploration budget ``log(t) + 3 * log(log(t))`` with
        ``t = self.balls_played``, divided by the arm's pull count.  Every
        arm must have been pulled at least once and ``t`` must exceed 1;
        ``get_action`` guarantees both by only calling this once
        ``balls_played >= 6``.
        """
        budget = np.log(self.balls_played) + 3 * np.log(
            np.log(self.balls_played)
        )
        for action in range(self.NUM_ARMS):
            p_a = self.arm_rewards[action] / self.pulls[action]
            rhs = budget / self.pulls[action]
            self.ucb_arms[action] = self.solve_q(rhs, p_a)

    def get_action(self, wicket, runs_scored):
        """Record the outcome of the previous ball and pick the next arm.

        Args:
            wicket: 1 if the previous ball took a wicket, else 0.  Ignored
                on the very first call because no ball has been played yet.
            runs_scored: Runs scored off the previous ball (also ignored on
                the first call).

        Returns:
            Index of the arm to play next, as a plain ``int`` in ``0..5``.
        """
        if self.balls_played == 0:
            action = 0
        else:
            # Credit the feedback to the arm that produced it.
            self.runs_scored += runs_scored
            self.wickets_down += wicket
            self.total_reward += 1 - wicket

            self.arm_rewards[self.last_played] += 1 - wicket
            self.pulls[self.last_played] += 1

            if self.balls_played < self.NUM_ARMS:
                # Initial round-robin: play every arm once.
                action = self.balls_played
            else:
                self.calculate_ucb()
                best = np.flatnonzero(self.ucb_arms == np.amax(self.ucb_arms))
                # Ties are broken in favour of the highest arm index.
                action = int(best.max())

        self.last_played = action
        self.balls_played += 1
        return action

class Environment:
    """Simulated innings that queries an agent for one action per ball.

    The agent must expose ``get_action(wicket, runs_scored)`` and return an
    index into the six-entry action tables defined in ``__init__``.
    """

    def __init__(self, num_balls, agent):
        self.num_balls = num_balls
        self.agent = agent

        # Time spent inside the agent's get_action, summed over all calls.
        self.__run_time = 0
        self.__start_time = 0
        self.__end_time = 0

        # Per-innings tallies (reset at the start of innings()).
        self.__total_runs = 0
        self.__total_wickets = 0

        # Outcome of the most recent ball, fed to the agent on the next call.
        self.__runs_scored = 0
        self.__wicket = 0

        # Regret accumulators; these are never reset by innings().
        self.__regret_w = 0
        self.__regret_s = 0
        self.__regret_rho = 0

        # Per-action wicket probability, scoring probability and run value.
        self.__p_out = np.array([0.001, 0.01, 0.02, 0.03, 0.1, 0.3])
        self.__p_run = np.array([1, 0.9, 0.85, 0.8, 0.75, 0.7])
        self.__action_runs_map = np.array([0, 1, 2, 3, 4, 6])

        # Expected runs per ball, and that value divided by wicket probability.
        self.__s = (1 - self.__p_out) * self.__p_run * self.__action_runs_map
        self.__rho = self.__s / self.__p_out

    def __get_action(self):
        """Ask the agent for its next action and time how long it takes."""
        self.__start_time = time.time()
        chosen = self.agent.get_action(self.__wicket, self.__runs_scored)
        self.__end_time = time.time()
        self.__run_time = self.__run_time + self.__end_time - self.__start_time
        return chosen

    def __get_outcome(self, action):
        """Sample ``(wicket, runs)`` for one ball played with ``action``."""
        p_wicket = self.__p_out[action]
        p_score = self.__p_run[action]

        wicket = np.random.choice(2, 1, p=[1 - p_wicket, p_wicket])[0]
        if wicket != 0:
            # No runs are scored on a ball that takes a wicket.
            return wicket, 0

        scored = np.random.choice(2, 1, p=[1 - p_score, p_score])[0]
        return wicket, self.__action_runs_map[action] * scored

    def innings(self):
        """Play ``num_balls`` balls and return the summary statistics.

        Returns:
            Tuple ``(regret_w, regret_s, regret_rho, total_runs,
            total_wickets, run_time)``.  Runs and wickets cover this call
            only; the regrets and run time keep accumulating across calls.
        """
        self.__total_runs = 0
        self.__total_wickets = 0
        self.__runs_scored = 0

        # Reference values of the best action under each criterion.
        lowest_p_out = np.min(self.__p_out)
        best_s = np.max(self.__s)
        best_rho = np.max(self.__rho)

        for _ in range(self.num_balls):
            action = self.__get_action()
            self.__wicket, self.__runs_scored = self.__get_outcome(action)

            self.__total_runs += self.__runs_scored
            self.__total_wickets += self.__wicket

            self.__regret_w += self.__p_out[action] - lowest_p_out
            self.__regret_s += best_s - self.__s[action]
            self.__regret_rho += best_rho - self.__rho[action]

        return (
            self.__regret_w,
            self.__regret_s,
            self.__regret_rho,
            self.__total_runs,
            self.__total_wickets,
            self.__run_time,
        )

https://colab.research.google.com/drive/1WseZcW4oq6tTOXqnuRpoeqsV--4EJkkb#printMode=true 2/3
5/12/24, 8:36 AM Q1.ipynb - Colab
# Play one 1000-ball innings with a fresh agent and report the summary.
agent = Agent()
environment = Environment(1000, agent)

innings_summary = environment.innings()
(
    regret_w,
    regret_s,
    reger_rho,
    total_runs,
    total_wickets,
    run_time,
) = innings_summary

# Same six values, in the order returned by innings().
print(*innings_summary)

4.189999999999989 2660.071000000038 70547.89999999957 292 7 0.17612314224243164

https://colab.research.google.com/drive/1WseZcW4oq6tTOXqnuRpoeqsV--4EJkkb#printMode=true 3/3

Road To IELTS
0% (1)
Road To IELTS
3 pages
GII GRIN SCIE Conference Rating 1 Giu 2017 10.36.57 Output
No ratings yet
GII GRIN SCIE Conference Rating 1 Giu 2017 10.36.57 Output
330 pages
Q2.ipynb - Colab
No ratings yet
Q2.ipynb - Colab
3 pages
Q3.ipynb - Colab
No ratings yet
Q3.ipynb - Colab
3 pages
Q3 (1) .Ipynb - Colab
No ratings yet
Q3 (1) .Ipynb - Colab
3 pages
# Gradient Descent #Start #Learning Rate: November 6, 2024
No ratings yet
# Gradient Descent #Start #Learning Rate: November 6, 2024
418 pages
35 Case Syntax
No ratings yet
35 Case Syntax
269 pages
Q4.ipynb - Colab
No ratings yet
Q4.ipynb - Colab
4 pages
DMA - Sprufb8d
No ratings yet
DMA - Sprufb8d
43 pages
Ass1 Merged Merged
No ratings yet
Ass1 Merged Merged
19 pages
C1 W1
No ratings yet
C1 W1
17 pages
Angela Merkel Report Group3
100% (1)
Angela Merkel Report Group3
13 pages
Fuzzy Set
No ratings yet
Fuzzy Set
20 pages
Dindigul School of TNPSC: Indian Economy
No ratings yet
Dindigul School of TNPSC: Indian Economy
4 pages
Practical 5
No ratings yet
Practical 5
13 pages
Walchand Institute of Technology, Solapur Information Technology 2021-22 SEMESTER - I
No ratings yet
Walchand Institute of Technology, Solapur Information Technology 2021-22 SEMESTER - I
5 pages
Module 3 DLC Arq
No ratings yet
Module 3 DLC Arq
81 pages
Weka
No ratings yet
Weka
5 pages
ML - 6 - Jupyter Notebook
No ratings yet
ML - 6 - Jupyter Notebook
5 pages
ODDS RATIO Dari Excel
No ratings yet
ODDS RATIO Dari Excel
5 pages
HW - 2
No ratings yet
HW - 2
4 pages
Machine Learning Lab (3) Report (21 CP 81)
No ratings yet
Machine Learning Lab (3) Report (21 CP 81)
7 pages
DM Lab 7.ipynb - Colaboratory
No ratings yet
DM Lab 7.ipynb - Colaboratory
3 pages
Problem Solving Skills Kepner Tregoe Solution
No ratings yet
Problem Solving Skills Kepner Tregoe Solution
114 pages
AI Lab10
No ratings yet
AI Lab10
4 pages
Plotting_polynomials_01
No ratings yet
Plotting_polynomials_01
24 pages
Rationalism and Scientific Temper Presentation
100% (1)
Rationalism and Scientific Temper Presentation
13 pages
Experiment 4
No ratings yet
Experiment 4
7 pages
Project1 2022 Fall
No ratings yet
Project1 2022 Fall
4 pages
Board of Directors: Search TC
No ratings yet
Board of Directors: Search TC
13 pages
vertopal.com_5. BackPropagation
No ratings yet
vertopal.com_5. BackPropagation
8 pages
Alkydprimer: Technical Data Sheet
No ratings yet
Alkydprimer: Technical Data Sheet
5 pages
CS6700 Programming Assignment 2
No ratings yet
CS6700 Programming Assignment 2
17 pages
Matlab Code For Power Consumption
No ratings yet
Matlab Code For Power Consumption
2 pages
import gym
No ratings yet
import gym
4 pages
# ELG 5255 Applied Machine Learning Fall 2020 # Assignment 3 (Multivariate Method)
No ratings yet
# ELG 5255 Applied Machine Learning Fall 2020 # Assignment 3 (Multivariate Method)
8 pages
How To Take Care of An Egg Baby Project
0% (1)
How To Take Care of An Egg Baby Project
3 pages
Machine Learning
No ratings yet
Machine Learning
31 pages
S. No. Educ Ation Salar y Dum My - H S Dum My - G Dum My - P G
No ratings yet
S. No. Educ Ation Salar y Dum My - H S Dum My - G Dum My - P G
5 pages
ADADELTA
No ratings yet
ADADELTA
2 pages
21 CP 46 - (ML LAB 3)
No ratings yet
21 CP 46 - (ML LAB 3)
13 pages
Rating
No ratings yet
Rating
1 page
Pseudo Code For Go Daddy Go and Point Eval
No ratings yet
Pseudo Code For Go Daddy Go and Point Eval
3 pages
Scoa Codes
No ratings yet
Scoa Codes
9 pages
Cricket Score Python Automation Description
No ratings yet
Cricket Score Python Automation Description
3 pages
正規化411210002
No ratings yet
正規化411210002
8 pages
USA Today - Pursuing The Network Strategy (HBS 402-010) Ch02
No ratings yet
USA Today - Pursuing The Network Strategy (HBS 402-010) Ch02
13 pages
Origin CFG
No ratings yet
Origin CFG
1 page
正規化411210002
No ratings yet
正規化411210002
8 pages
7 - Gamification in Teaching
No ratings yet
7 - Gamification in Teaching
12 pages
HW1
No ratings yet
HW1
2 pages
Thesis For Certificate of English Competency: Calistrat Hogas Arts and Sciences High School
No ratings yet
Thesis For Certificate of English Competency: Calistrat Hogas Arts and Sciences High School
50 pages
Department of Electrical Engineering School of Science and Engineering EE514/CS535 Machine Learning Homework 1
No ratings yet
Department of Electrical Engineering School of Science and Engineering EE514/CS535 Machine Learning Homework 1
11 pages
download
No ratings yet
download
2 pages
CS PH PH103. Hein - M DD 2018 2
100% (1)
CS PH PH103. Hein - M DD 2018 2
5 pages
Abu Minhaj Farooqi 37560 Ai Lab Final Exam
No ratings yet
Abu Minhaj Farooqi 37560 Ai Lab Final Exam
14 pages
ML Project
No ratings yet
ML Project
10 pages
Experiment1111
No ratings yet
Experiment1111
25 pages
Opti Output
No ratings yet
Opti Output
6 pages
DEEPAK
No ratings yet
DEEPAK
6 pages
Colleges in A.P
No ratings yet
Colleges in A.P
66 pages
multi-arm-bandit problem
No ratings yet
multi-arm-bandit problem
11 pages
L2 Projection Piecewise
No ratings yet
L2 Projection Piecewise
9 pages
Hammer NumericalIntegrationSimplexes 1956
No ratings yet
Hammer NumericalIntegrationSimplexes 1956
9 pages
Dream Team
No ratings yet
Dream Team
4 pages
Player
No ratings yet
Player
2 pages
Praveen S K Resume Updated
No ratings yet
Praveen S K Resume Updated
4 pages
outputCode (1)
No ratings yet
outputCode (1)
2 pages
ATUL MLT EXP 4-11
No ratings yet
ATUL MLT EXP 4-11
17 pages
Gauss Legendre Quadrature Over A Triangle
No ratings yet
Gauss Legendre Quadrature Over A Triangle
7 pages
assgmt1
No ratings yet
assgmt1
7 pages
Argha's ML LAB_240927_121838
No ratings yet
Argha's ML LAB_240927_121838
13 pages
Assignment EE5179 ME20B145 Report
No ratings yet
Assignment EE5179 ME20B145 Report
6 pages
Essential Oils1
100% (1)
Essential Oils1
6 pages
032 EEE135 Out
No ratings yet
032 EEE135 Out
2 pages
EE 559 HW2Code PDF
No ratings yet
EE 559 HW2Code PDF
7 pages
SRM Eswari Workshop Day 1 - Feb 2025 - Jupyter Notebook
No ratings yet
SRM Eswari Workshop Day 1 - Feb 2025 - Jupyter Notebook
39 pages
CS6700 RL 2024 Wa1
No ratings yet
CS6700 RL 2024 Wa1
7 pages
DELIMITATION
No ratings yet
DELIMITATION
4 pages
HW2_110306073.ipynb - Colaboratory
No ratings yet
HW2_110306073.ipynb - Colaboratory
3 pages
Australia Awards Sri-Lanka
No ratings yet
Australia Awards Sri-Lanka
4 pages
Research Methodology
No ratings yet
Research Methodology
41 pages
CVDL(Practical No. 3)
No ratings yet
CVDL(Practical No. 3)
1 page
Quadrature Rules For Numerical Integration Over Triangles and Tetrahedra
No ratings yet
Quadrature Rules For Numerical Integration Over Triangles and Tetrahedra
3 pages
perceptron-numpy
No ratings yet
perceptron-numpy
3 pages
Benzene Chlorobenzene VLE Data
No ratings yet
Benzene Chlorobenzene VLE Data
8 pages
1 - All Python Codes + Neo4j Samples
No ratings yet
1 - All Python Codes + Neo4j Samples
16 pages
Heat Exchangers: The Effectiveness - NTU Method: Sections 11.4 Through 11.7
No ratings yet
Heat Exchangers: The Effectiveness - NTU Method: Sections 11.4 Through 11.7
15 pages
Lab. 6 Buffer Solutions
100% (1)
Lab. 6 Buffer Solutions
4 pages
Standards For Language Learning
No ratings yet
Standards For Language Learning
2 pages
The Twenty Five Card Trick
No ratings yet
The Twenty Five Card Trick
6 pages
Triangle Quadratureby Mapping
No ratings yet
Triangle Quadratureby Mapping
2 pages
Data - Preprocessing - Tools - Ipynb - Colaboratory
No ratings yet
Data - Preprocessing - Tools - Ipynb - Colaboratory
4 pages
DEL MAA: Rahul / Rahul MR AI0538
No ratings yet
DEL MAA: Rahul / Rahul MR AI0538
1 page
DLP in Eng 6 Cause and Effect
No ratings yet
DLP in Eng 6 Cause and Effect
10 pages
Name Saskia Meaning, Origin Etc. - Girl Names - B
No ratings yet
Name Saskia Meaning, Origin Etc. - Girl Names - B
1 page
De Moiver's Theorem (Trigonometry) Mathematics Question Bank
From Everand
De Moiver's Theorem (Trigonometry) Mathematics Question Bank
Mohmmad Khaja Shareef
No ratings yet
Inverse Trigonometric Functions (Trigonometry) Mathematics Question Bank
From Everand
Inverse Trigonometric Functions (Trigonometry) Mathematics Question Bank
Mohmmad Khaja Shareef
No ratings yet

Note: This service is not intended for secure transactions such as banking, social media, email, or purchasing. Use at your own risk. We assume no liability whatsoever for broken pages.

Q1.ipynb - Colab

Uploaded by

Q1.ipynb - Colab

Uploaded by

5/12/24, 8:36 AM Q1.

4.189999999999989 2660.071000000038 70547.89999999957 292 7 0.17612314224243164

You might also like

Pfad - The Proxy pFad of © 2024 Garber Painting. All rights reserved.