0% found this document useful (0 votes)
21 views21 pages

DARecord

Data Analytics Record JNTUH

Uploaded by

A0565
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
21 views21 pages

DARecord

Data Analytics Record JNTUH

Uploaded by

A0565
Copyright
© All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as PDF, TXT or read online on Scribd
You are on page 1/ 21

1.

Demonstrate data cleaning – missing values


# Program 1: Data cleaning - introduce missing values into mtcars at
# random positions, locate/count them, and impute 'disp' with its mean.
library(tidyverse)

# Seed the RNG so the NA positions (and all printed results) reproduce.
set.seed(42)

# 20 random (row, column) targets; mtcars has 32 rows and 11 columns,
# so draws from 1:21 and 1:10 are always in range.
x <- sample(1:21, 20, replace = TRUE)
y <- sample(1:10, 20, replace = TRUE)

# Blank out each chosen cell (duplicate picks just re-assign NA).
for (i in seq_along(x)) {
  mtcars[x[i], y[i]] <- NA
}

which(is.na(mtcars))   # linear indices of the injected NAs
sum(is.na(mtcars))     # total NA count (< 20 if picks collided)
na.exclude(mtcars)     # listwise deletion, printed only; mtcars unchanged
view(mtcars)

# Mean of 'disp' ignoring NAs, used below to impute the missing entries.
dispna <- mean(mtcars$disp, na.rm = TRUE)
view(dispna)

# Replace the missing 'disp' values with the column mean.
newcars <- mtcars %>%
  mutate(disp = ifelse(is.na(disp), dispna, disp))
view(newcars)

Output
> which(is.na(mtcars))
[1] 1 10 33 37 42 48 66 69 73 76 77 85 101 105 112 115 116 136 149 16
2 170 171
[23] 174 175 193 194 196 203 206 213 239 245 261 290 298 305

> sum(is.na(mtcars))
[1] 36

1
> na.exclude(mtcars)
mpg cyl disp hp drat wt qsec vs am gear carb
Datsun 710 22.8 4 108.0 93 3.85 2.320 18.61 1 1 4 1
Valiant 18.1 6 225.0 105 2.76 3.460 20.22 1 0 3 1
Duster 360 14.3 8 360.0 245 3.21 3.570 15.84 0 0 3 4
Fiat 128 32.4 4 78.7 66 4.08 2.200 19.47 1 1 4 1
Dodge Challenger 15.5 8 318.0 150 2.76 3.520 16.87 0 0 3 2
AMC Javelin 15.2 8 304.0 150 3.15 3.435 17.30 0 0 3 2
Camaro Z28 13.3 8 350.0 245 3.73 3.840 15.41 0 0 3 4
Pontiac Firebird 19.2 8 400.0 175 3.08 3.845 17.05 0 0 3 2
Fiat X1-9 27.3 4 79.0 66 4.08 1.935 18.90 1 1 4 1
Porsche 914-2 26.0 4 120.3 91 4.43 2.140 16.70 0 1 5 2
Lotus Europa 30.4 4 95.1 113 3.77 1.513 16.90 1 1 5 2
Ford Pantera L 15.8 8 351.0 264 4.22 3.170 14.50 0 1 5 4
Ferrari Dino 19.7 6 145.0 175 3.62 2.770 15.50 0 1 5 6
Maserati Bora 15.0 8 301.0 335 3.54 3.570 14.60 0 1 5 8
Volvo 142E 21.4 4 121.0 109 4.11 2.780 18.60 1 1 4 2

2
2. Implement data normalization (min-max, z-score)
# Program 2: Data normalization - min-max scaling and z-score
# standardization of a numeric vector.
arr <- c(9.5, 6.2, 8.9, 15.2, 20.0, 10.1, 5.4, 3.2, 1.0, 22.5, 10.0, 16.0)

# --- Min-max normalization: rescale to [0, 1] ---
minarr <- min(arr)
maxarr <- max(arr)
# Vectorized (no element loop).  BUG FIX: round to 2 decimals; the
# original round() with no digits collapsed every value to 0 or 1,
# destroying the normalization.
arr2 <- round((arr - minarr) / (maxarr - minarr), 2)
print(arr2)

# --- Z-score standardization: center to mean 0, scale to sd 1 ---
meanarr <- mean(arr)
sdarr <- sd(arr)
arr2 <- round((arr - meanarr) / sdarr, 2)
print(arr2)

Output:
> print(arr2)
[1] 0 0 0 1 1 0 0 0 0 1 0 1
>
> #z-score
> meanarr <- mean(arr)
> sdarr <- sd(arr)
> for (i in 1:12){
+ arr2[i] = round((arr[i]-meanarr)/sdarr, 2)
+}
> print(arr2)
[1] -0.18 -0.68 -0.27 0.69 1.42 -0.09 -0.80 -1.13 -1.47 1.79 -0.10 0.81

3
3. Implement attribute subset selection for data reduction
# Program 3: Attribute subset selection (forward, backward, exhaustive)
# for data reduction, predicting Freq from the other Titanic attributes.
# BUG FIX: regsubsets() is in the 'leaps' package and %>%/view() come
# from the tidyverse; neither was loaded here.
library(leaps)
library(tidyverse)

view(Titanic)
sum(is.na(Titanic))

# Drop any incomplete rows before model selection.
Titanic <- Titanic %>%
  na.omit()
dim(Titanic)

# Best-subset searches over all predictors of Freq.
fwd <- regsubsets(Freq ~ ., data = Titanic, nvmax = 19, method = "forward")
bwd <- regsubsets(Freq ~ ., data = Titanic, nvmax = 19, method = "backward")
full <- regsubsets(Freq ~ ., data = Titanic, nvmax = 19)  # exhaustive

summary(fwd)
summary(bwd)
summary(full)

# Coefficients of the best 3-variable model found by each method.
coef(fwd, 3)
coef(bwd, 3)
coef(full, 3)

Output:
> summary(fwd)
Subset selection object
Call: regsubsets.formula(Freq ~ ., data = Titanic, nvmax = 19, method = "forward")
6 Variables (and intercept)
Forced in Forced out
Class2nd FALSE FALSE
Class3rd FALSE FALSE
ClassCrew FALSE FALSE
SexFemale FALSE FALSE
AgeAdult FALSE FALSE
SurvivedYes FALSE FALSE
1 subsets of each size up to 6
Selection Algorithm: forward
Class2nd Class3rd ClassCrew SexFemale AgeAdult SurvivedYes
1 (1)"" "" "" "" "*" " "

4
2 (1)"" "" "" "*" "*" " "
3 (1)"" "" "" "*" "*" "*"
4 (1)"" " " "*" "*" "*" "*"
5 (1)"" "*" "*" "*" "*" "*"
6 ( 1 ) "*" "*" "*" "*" "*" "*"

> summary(bwd)
Subset selection object
Call: regsubsets.formula(Freq ~ ., data = Titanic, nvmax = 19, method = "backward")
6 Variables (and intercept)
Forced in Forced out
Class2nd FALSE FALSE
Class3rd FALSE FALSE
ClassCrew FALSE FALSE
SexFemale FALSE FALSE
AgeAdult FALSE FALSE
SurvivedYes FALSE FALSE
1 subsets of each size up to 6
Selection Algorithm: backward
Class2nd Class3rd ClassCrew SexFemale AgeAdult SurvivedYes
1 (1)"" "" "" "" "*" " "
2 (1)"" "" "" "*" "*" " "
3 (1)"" "" "" "*" "*" "*"
4 ( 1 ) " " " " "*" "*" "*" "*"
5 ( 1 ) " " "*" "*" "*" "*" "*"
6 ( 1 ) "*" "*" "*" "*" "*" "*"

> summary(full)
Subset selection object
Call: regsubsets.formula(Freq ~ ., data = Titanic, nvmax = 19)
6 Variables (and intercept)
Forced in Forced out
Class2nd FALSE FALSE
Class3rd FALSE FALSE
ClassCrew FALSE FALSE
SexFemale FALSE FALSE
AgeAdult FALSE FALSE
SurvivedYes FALSE FALSE
1 subsets of each size up to 6
Selection Algorithm: exhaustive

5
Class2nd Class3rd ClassCrew SexFemale AgeAdult SurvivedYes
1 (1)"" "" "" "" "*" " "
2 (1)"" "" "" "*" "*" " "
3 (1)"" "" "" "*" "*" "*"
4 ( 1 ) " " " " "*" "*" "*" "*"
5 ( 1 ) " " "*" "*" "*" "*" "*"
6 ( 1 ) "*" "*" "*" "*" "*" "*"
>
> coef(fwd, 3)
(Intercept) SexFemale AgeAdult SurvivedYes
70.5625 -78.8125 123.9375 -48.6875
> coef(bwd, 3)
(Intercept) SexFemale AgeAdult SurvivedYes
70.5625 -78.8125 123.9375 -48.6875
> coef(full, 3)
(Intercept) SexFemale AgeAdult SurvivedYes
70.5625 -78.8125 123.9375 -48.6875
>

6
4. Demonstrate outlier detection
# Program 4: Outlier detection - flag boxplot outliers in the 'day'
# data set (loaded elsewhere), replace them with NA, then drop them.
view(day)
sum(is.na(day))
boxplot(day[, c("temp", "hum", "windspeed")])

for (col in c("hum", "windspeed")) {
  vals <- unlist(day[col])
  # boxplot.stats()$out lists the points beyond the whiskers.
  outliers <- vals[vals %in% boxplot.stats(vals)$out]
  vals[vals %in% outliers] <- NA
  day[col] <- vals
}

# BUG FIX: count NAs in the whole data set; the original counted NAs in
# the loop's temporary vector ('data'), not in 'day'.
sum(is.na(day))
day <- drop_na(day)
boxplot(day[, c("temp", "hum", "windspeed")])

7
Output:

8
5. Perform analytics on any standard data set
# Program 5: Exploratory analytics on the Titanic passenger data
# ('titanic' tibble loaded elsewhere, e.g. read from a CSV).
library(tidyverse)

head(titanic)
sapply(titanic, class)

# Treat categorical columns as factors so summary() tabulates them.
titanic$Sex <- as.factor(titanic$Sex)
titanic$Survived <- as.factor(titanic$Survived)
summary(titanic)

# Complete rows only, then split by survival outcome.
dropnull_titanic <- titanic[rowSums(is.na(titanic)) <= 0, ]
survivedList <- dropnull_titanic[dropnull_titanic$Survived == 1, ]
notSurvivedList <- dropnull_titanic[dropnull_titanic$Survived == 0, ]

# Pie chart of survival counts.
mytable <- table(titanic$Survived)
# BUG FIX: label the slices with the table's own names (the survival
# levels), not names(titanic), which are the 12 column names and do not
# pair up with the 2 slices.
lbls <- paste(names(mytable), "\n", mytable, sep = "")
pie(
  mytable,
  labels = lbls,
  main = "pie chart"
)

hist(titanic$Age, xlab = "gender", ylab = "frequency")
barplot(table(notSurvivedList$Sex), xlab = "gender", ylab = "frequency")

# Density of fares paid by survivors, drawn as a filled polygon.
temp <- density(table(survivedList$Fare))
plot(temp, type = "n", main = "fare charged")
polygon(temp, col = "lightgray", border = "gray")

boxplot(titanic$Fare, main = "fare")

9
# A tibble: 6 × 12
PassengerId Survived Pclass Name Sex Age SibSp Parch Ticket Fare Ca
bin Embarked
<dbl> <fct> <dbl> <chr> <fct> <dbl> <dbl> <dbl> <chr> <dbl> <chr> <
chr>
1 892 0 3 Kelly, Mr. J… male 34.5 0 0 330911 7.83 NA Q
2 893 1 3 Wilkes, Mrs.… fema… 47 1 0 363272 7 NA S
3 894 0 2 Myles, Mr. T… male 62 0 0 240276 9.69 NA Q
4 895 0 3 Wirz, Mr. Al… male 27 0 0 315154 8.66 NA S
5 896 1 3 Hirvonen, Mr… fema… 22 1 1 31012… 12.3 NA S
6 897 0 3 Svensson, Mr… male 14 0 0 7538 9.22 NA S
> sapply(titanic, class)
PassengerId Survived Pclass Name Sex Age SibSp
"numeric" "factor" "numeric" "character" "factor" "numeric" "numeric"
Parch Ticket Fare Cabin Embarked
"numeric" "character" "numeric" "character" "character"
> summary(titanic)
PassengerId Survived Pclass Name Sex Age
Min. : 892.0 0:266 Min. :1.000 Length:418 female:152 Min. : 0.17
1st Qu.: 996.2 1:152 1st Qu.:1.000 Class :character male :266 1st Qu.:21
.00
Median :1100.5 Median :3.000 Mode :character Median :27.0
0
Mean :1100.5 Mean :2.266 Mean :30.27
3rd Qu.:1204.8 3rd Qu.:3.000 3rd Qu.:39.00
Max. :1309.0 Max. :3.000 Max. :76.00
NA's :86
SibSp Parch Ticket Fare Cabin
Min. :0.0000 Min. :0.0000 Length:418 Min. : 0.000 Length:418
1st Qu.:0.0000 1st Qu.:0.0000 Class :character 1st Qu.: 7.896 Class :chara
cter
Median :0.0000 Median :0.0000 Mode :character Median : 14.454 Mode
:character
Mean :0.4474 Mean :0.3923 Mean : 35.627
3rd Qu.:1.0000 3rd Qu.:0.0000 3rd Qu.: 31.500
Max. :8.0000 Max. :9.0000 Max. :512.329
NA's :1
Embarked
Length:418
Class :character

10
Mode :character

11
6. Implement linear regression
# Program 6: Simple linear regression of salary on years of experience.
data <- data.frame(
  Years_Exp = c(1.1, 1.3, 1.5, 2.0, 2.2, 2.9, 3.0, 3.2, 3.2, 3.7),
  Salary = c(39343.00, 46205.00, 37731.00, 43525.00,
             39891.00, 56642.00, 60150.00, 54445.00, 64445.00, 57189.00)
)

library(caTools)
library(ggplot2)  # needed for ggplot()/geom_* below; was never loaded

set.seed(123)     # make the 70/30 train/test split reproducible
split <- sample.split(data$Salary, SplitRatio = 0.7)
train <- subset(data, split == TRUE)
test <- subset(data, split == FALSE)

# Fit Salary ~ Years_Exp on the training rows.
lm.r <- lm(formula = Salary ~ Years_Exp, data = train)
coef(lm.r)

# BUG FIX: predict() takes 'newdata', not 'data' (the original argument
# was silently ignored).  Keep '+' at end of line so the ggplot chain
# parses as one expression instead of breaking at top level.
ggplot() +
  geom_point(aes(x = train$Years_Exp, y = train$Salary), col = 'red') +
  geom_line(aes(x = train$Years_Exp, y = predict(lm.r, newdata = train)),
            col = "blue") +
  ggtitle("salary vs experience")

Output:
(Intercept) Years_Exp
29172.310 8922.322

12
7. Implement logistic regression
# Program 7: Logistic regression of engine shape (vs) on weight (wt)
# and displacement (disp) in mtcars, with confusion matrix, accuracy,
# and an ROC curve / AUC on the held-out rows.
library(tidyverse)
library(ROCR)
library(caTools)

view(mtcars)

set.seed(123)  # reproducible split
# BUG FIX: sample.split() expects the outcome vector, not the whole
# data frame; and the result is logical, so compare to TRUE, not "TRUE".
split <- sample.split(mtcars$vs, SplitRatio = 0.8)
train <- subset(mtcars, split == TRUE)
test <- subset(mtcars, split == FALSE)

# Binomial GLM: models P(vs = 1) as a function of wt and disp.
logistic_model <- glm(vs ~ wt + disp, data = train, family = binomial)
summary(logistic_model)

# Predicted probabilities for the test rows.
predict_reg <- predict(logistic_model, test, type = "response")
predict_reg

# Threshold at 0.5 to obtain class labels.
predict_reg <- ifelse(predict_reg > 0.5, 1, 0)

# Confusion matrix (rows = actual, cols = predicted) and error rate.
table(test$vs, predict_reg)
missing_classerr <- mean(predict_reg != test$vs)
missing_classerr
print(paste("accuracy = ", (1 - missing_classerr)))

# Fitted logistic curve over the combined predictor wt + disp.
ggplot(mtcars, aes(x = wt + disp, y = vs)) +
  geom_point(alpha = .5) +
  stat_smooth(method = "glm", se = FALSE,
              method.args = list(family = binomial), col = "red")

# ROC curve and area under it.
ROCPred <- prediction(predict_reg, test$vs)
ROCPer <- performance(ROCPred, measure = "tpr", x.measure = "fpr")
auc <- performance(ROCPred, measure = "auc")
auc <- auc@y.values[[1]]
auc

# BUG FIX: seq() needs an end point; seq(0.1, by = 0.1) is an error.
plot(ROCPer, colorize = TRUE, print.cutoffs.at = seq(0.1, 1, by = 0.1),
     main = "ROC Curve")
abline(a = 0, b = 1)

auc <- round(auc, 4)
legend(.6, .4, auc, title = "AUC", cex = 1)

Output
Call:
glm(formula = vs ~ wt + disp, family = binomial, data = train)

Coefficients:
Estimate Std. Error z value Pr(>|z|)
(Intercept) 2.79114 2.96489 0.941 0.347
wt 0.85989 1.55388 0.553 0.580
disp -0.02718 0.01456 -1.866 0.062 .
---
Signif. codes: 0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1

(Dispersion parameter for binomial family taken to be 1)

Null deviance: 31.841 on 22 degrees of freedom


Residual deviance: 17.188 on 20 degrees of freedom

14
AIC: 23.188

Number of Fisher Scoring iterations: 6

>
> predict_reg <- predict(logistic_model, test, type = "response")
> predict_reg
Datsun 710 Hornet Sportabout Merc 230 Merc 450SLC
0.864210634 0.017371341 0.841966715 0.189302645
Lincoln Continental Toyota Corolla Pontiac Firebird Porsche 914-2
0.006385438 0.919574847 0.008373046 0.796023875
Maserati Bora
0.089476536
>
> predict_reg <- ifelse(predict_reg >0.5, 1, 0)
>
> table(test$vs, predict_reg)
   predict_reg
      0  1
   0  5  1
   1  0  3
>
> missing_classerr <- mean(predict_reg != test$vs)
> missing_classerr
[1] 0.1111111
> print(paste("accuracy = ", (1 - missing_classerr)))
[1] "accuracy = 0.888888888888889"
>
> library(ggplot2)
>
> #plot logistic regression curve
> ggplot(mtcars, aes(x=wt + disp, y=vs)) +
+ geom_point(alpha=.5) +
+ stat_smooth(method="glm", se=FALSE, method.args = list(family=binomial),
+ col="red")
`geom_smooth()` using formula = 'y ~ x'
> auc
[1] 0.9166667

15
16
8. Construct decision tree for weather data set
# Program 8: Conditional-inference decision tree for the weather data
# ('weatherdata' loaded elsewhere), predicting RainTomorrow.
set.seed(123)  # reproducible train/test assignment

# BUG FIX: make the target a factor so ctree() fits a classification
# tree.  With a numeric 0/1 target it fits a regression tree and
# predict() returns probabilities (exactly what the original output
# shows), which corrupts the confusion matrix.
weatherdata$RainTomorrow <- as.factor(weatherdata$RainTomorrow)

# Randomly mark ~80% of rows for training, the rest for testing.
sample <- sample(c(TRUE, FALSE), nrow(weatherdata), replace = TRUE,
                 prob = c(0.8, 0.2))
train <- weatherdata[sample, ]
test <- weatherdata[!sample, ]

library(partykit)
model <- ctree(RainTomorrow ~ ., train)
plot(model)

# Class predictions on the held-out rows.
predict_model <- predict(model, test)
predict_model

# Confusion matrix: rows = actual, cols = predicted.
mat <- table(test$RainTomorrow, predict_model)
mat

# Accuracy = correctly classified / total.
accuracy <- sum(diag(mat)) / sum(mat)
accuracy

Output:
predict_model
0.0478723404255319 0.175 0.625
0 52 10 5
1 7 4 4
>
> accuracy <- sum(diag(mat)) / sum(mat)
> accuracy
[1] 0.6829268

17
9. Analyse time-series data

# Program 9: Time-series analysis of weekly COVID-19 counts starting
# 22 January 2020: a multivariate plot and an ARIMA forecast, each
# written to its own PNG file.
positiveCases <- c(580, 7813, 28266, 59287, 75700, 87820, 95314, 126214,
                   218843, 471497, 936851, 1508725, 2072113)
deaths <- c(17, 270, 565, 1261, 2126, 2800,
            3285, 4628, 8951, 21283, 47210,
            88480, 138475)

library(lubridate)

# Multivariate weekly series (cases + deaths) -> PNG.
png(file = "multivariateTimeSeries.png")
mts <- ts(cbind(positiveCases, deaths),
          start = decimal_date(ymd("2020-01-22")),
          frequency = 365.25 / 7)
plot(mts, xlab = "Weekly Data",
     main = "COVID-19 Cases",
     col.main = "darkgreen")
# BUG FIX: close this device before opening the next one; the original
# opened two png() devices but called dev.off() once, so the first file
# was never finalized.
dev.off()

library(forecast)

# Univariate series of positive cases; forecast 5 periods ahead.
png(file = "timeseries.png")
mts1 <- ts(positiveCases, decimal_date(ymd("2020-01-22")),
           frequency = 365.25 / 7)
fit <- auto.arima(mts1)
fit <- forecast(fit, 5)
# BUG FIX: 'fit' already holds the 5-step forecast; plot it directly
# instead of calling forecast() on a forecast object again.
plot(fit, xlab = "weekly data", ylab = "positive cases",
     main = "COVID-19", col.main = "green")

dev.off()

Output:

19
10. Work on any data visualization tool
# Program 10: Data-visualization gallery on the built-in airquality
# data set: bar plot, histogram, box plots, scatter plot, and heat map.
view(airquality)

# Horizontal bar plot of daily ozone readings.
barplot(airquality$Ozone,
        main = 'Ozone Concenteration in air',
        xlab = 'ozone levels', horiz = TRUE)

# Histogram of daily maximum temperature.  BUG FIX: the title's line
# break must be the escape "\n"; a bare backslash before a newline is
# an R string syntax error (PDF line-wrap artifact).
hist(airquality$Temp, main = "La Guardia Airport's\nMaximum Temperature(Daily)",
     xlab = "Temperature(Fahrenheit)",
     xlim = c(50, 125), col = "yellow",
     freq = TRUE)

# Box plots of the four measurement columns.  BUG FIX: use 1:4; the 0
# in 0:4 selects nothing and only works by accident.
boxplot(airquality[, 1:4],
        main = 'Box Plots for Air Quality Parameters')

# Ozone concentration vs month of observation.
plot(airquality$Ozone, airquality$Month,
     main = "Scatterplot Example",
     xlab = "Ozone Concentration in parts per billion",
     ylab = " Month of observation ", pch = 19)

# Random 5x5 matrix for the heat map.  BUG FIX: a 5x5 matrix holds 25
# values; the original drew 50 and triggered a length-mismatch warning.
# Seed first so the plot reproduces.
set.seed(123)
data <- matrix(rnorm(25, 0, 5), nrow = 5, ncol = 5)

# Column names
colnames(data) <- paste0("col", 1:5)
rownames(data) <- paste0("row", 1:5)

# Draw a heatmap
heatmap(data)

20
Output

21

You might also like

pFad - Phonifier reborn

Pfad - The Proxy pFad of © 2024 Garber Painting. All rights reserved.

Note: This service is not intended for secure transactions such as banking, social media, email, or purchasing. Use at your own risk. We assume no liability whatsoever for broken pages.


Alternative Proxies:

Alternative Proxy

pFad Proxy

pFad v3 Proxy

pFad v4 Proxy