Добро пожаловать в Scribd!

Пропустить карусель

CH 5

Загружено:

Anonymous

0% нашли этот документ полезным (0 голосов)

73 просмотра · 3 страницы

Data for the related model

Оригинальное название

Ch5

Авторское право

Доступные форматы

TXT, PDF, TXT или читайте онлайн в Scribd

Поделиться этим документом

Поделиться или встроить документ

Параметры публикации

Этот документ был вам полезен?

Это неприемлемый материал?

Пожаловаться на этот документ

Data for the related model

Авторское право:

Доступные форматы

Скачайте в формате TXT, PDF, TXT или читайте онлайн в Scribd

Отметить как неприемлемый контент

0% нашли этот документ полезным (0 голосов)

73 просмотра · 3 страницы

CH 5

Загружено:

Anonymous

Data for the related model

Авторское право:

Доступные форматы

Скачайте в формате TXT, PDF, TXT или читайте онлайн в Scribd

Отметить как неприемлемый контент

Перейти к странице

Вы находитесь на странице: 1 из 3

Поиск в документе

#### Table 5.

# package forecast is required to evaluate performance

library(forecast)

# load file
toyota.corolla.df <- read.csv("ToyotaCorolla.csv")

# Randomly generate disjoint training (600 rows) and validation (400 rows)
# sets. Row positions are sampled rather than values of the Id column: both
# `lm(subset = )` and `df[i, ]` index by position, so an Id that does not equal
# its row number would select the wrong row (or an all-NA row when the Id is
# larger than nrow()).
training <- sample(nrow(toyota.corolla.df), 600)
validation <- sample(
  setdiff(seq_len(nrow(toyota.corolla.df)), training),
  400
)

# Run a linear regression of Price on every remaining column; the columns at
# positions 1, 2, 8 and 11 are dropped from the model data.
# na.exclude keeps the training predictions padded to the length of `training`,
# so they stay aligned with the Price vector passed to accuracy() below.
reg <- lm(Price ~ ., data = toyota.corolla.df[, -c(1, 2, 8, 11)],
          subset = training, na.action = na.exclude)

# Predictions for the training rows (fitted values) and the validation rows.
# na.pass leaves rows with missing predictors in place (as NA predictions)
# instead of dropping them, again to preserve alignment with Price.
pred_t <- predict(reg, na.action = na.pass)
pred_v <- predict(reg,
                  newdata = toyota.corolla.df[validation, -c(1, 2, 8, 11)],
                  na.action = na.pass)

## evaluate performance (accuracy() comes from package forecast)
# training
accuracy(pred_t, toyota.corolla.df[training, ]$Price)
# validation
accuracy(pred_v, toyota.corolla.df[validation, ]$Price)

#### Figure 5.2

# Remove rows with a missing Price. The NA mask is computed over the whole
# Price column so that it has one entry per row of the data frame being
# filtered (a mask built from a subset of rows would be recycled and drop or
# keep arbitrary rows).
toyota.corolla.df <- toyota.corolla.df[!is.na(toyota.corolla.df$Price), ]

# Generate random, non-overlapping training and validation sets. Row positions
# are sampled (not Id values): after the filtering above an Id is not
# guaranteed to match its row number. setdiff() keeps training rows out of the
# validation sample so the validation metrics are not contaminated.
training <- sample(nrow(toyota.corolla.df), 600)
validation <- sample(
  setdiff(seq_len(nrow(toyota.corolla.df)), training),
  400
)

# Regression of Price on every remaining column (positions 1, 2, 8 and 11 are
# dropped from the model data).
reg <- lm(Price ~ ., data = toyota.corolla.df[, -c(1, 2, 8, 11)],
          subset = training)

# predictions for the validation rows
pred_v <- predict(reg, newdata = toyota.corolla.df[validation, -c(1, 2, 8, 11)])

# load package gains, compute gains (we will use package caret for categorical
# y later)
library(gains)

# Only validation cases that actually received a prediction can be ranked.
# The same set of cases feeds the gains table, the cumulative total and the
# baseline, so the lift curve and the baseline end at the same point.
scored <- !is.na(pred_v)
price <- toyota.corolla.df[validation, ]$Price[scored]
gain <- gains(price, pred_v[scored])

# cumulative lift chart
options(scipen = 999) # avoid scientific notation on the axes
# the gain is expressed relative to total price of the scored cases
plot(c(0, gain$cume.pct.of.total * sum(price)) ~ c(0, gain$cume.obs),
     xlab = "# cases", ylab = "Cumulative Price", main = "Lift Chart",
     type = "l")

# baseline: straight line from the origin to (number of cases, total price)
lines(c(0, sum(price)) ~ c(0, length(price)), col = "gray", lty = 2)

# Decile-wise lift chart: mean response per group relative to the overall mean
barplot(gain$mean.resp / mean(price), names.arg = gain$depth,
        xlab = "Percentile", ylab = "Mean Response",
        main = "Decile-wise lift chart")

#### Table 5.5

library(caret)
library(e1071)

owner.df <- read.csv("ownerExample.csv")

# caret::confusionMatrix() requires `data` and `reference` to be factors with
# the same levels; character vectors (what ifelse() and, in R >= 4.0,
# read.csv() produce) are rejected. Build the reference factor once and reuse
# its levels for every prediction vector.
owner.actual <- as.factor(owner.df$Class)

# Confusion matrix at each probability cutoff: a case is labelled "owner" when
# its Probability exceeds the cutoff and "nonowner" otherwise.
for (cutoff in c(0.5, 0.25, 0.75)) {
  owner.predicted <- factor(
    ifelse(owner.df$Probability > cutoff, "owner", "nonowner"),
    levels = levels(owner.actual)
  )
  # print() is needed because results are not auto-printed inside a loop
  print(confusionMatrix(owner.predicted, owner.actual))
}

#### Figure 5.4

# replace data.frame with your own
df <- read.csv("liftExample.csv")

# cutoff values at which accuracy is evaluated
cutoffs <- seq(0, 1, 0.1)

# caret::confusionMatrix() requires factors with identical levels. The levels
# are fixed explicitly because at extreme cutoffs every case is predicted as a
# single class, which would otherwise yield a one-level factor.
# NOTE(review): assumes df$actual is coded 0/1, matching the 0/1 predictions
# produced by `1 * (df$prob > cutoff)` - confirm against the data file.
actual.class <- factor(df$actual, levels = c(0, 1))

# compute accuracy per cutoff (one value per cutoff, no vector growing in a
# loop)
accT <- vapply(cutoffs, function(cutoff) {
  predicted.class <- factor(1 * (df$prob > cutoff), levels = c(0, 1))
  cm <- confusionMatrix(predicted.class, actual.class)
  cm$overall[["Accuracy"]]
}, numeric(1))

# plot accuracy (solid) and overall error = 1 - accuracy (dashed)
plot(accT ~ cutoffs, xlab = "Cutoff Value", ylab = "", type = "l",
     ylim = c(0, 1))
lines(1 - accT ~ cutoffs, type = "l", lty = 2)
legend("topright", c("accuracy", "overall error"), lty = c(1, 2), merge = TRUE)

#### Figure 5.5

library(pROC)
# Build the ROC object: `actual` is passed as the response and `prob` as the
# predictor.
r <- roc(response = df$actual, predictor = df$prob)

# draw the ROC curve
plot.roc(r)

# area under the ROC curve
auc(r)
#### Figure 5.6

# Option 1 - package 'caret':
# lift() takes the class as a factor; relevel() makes "1" the reference level.

library(caret)
lift.example <- lift(
  relevel(as.factor(actual), ref = "1") ~ prob,
  data = df
)
xyplot(lift.example, plot = "gain")

# Option 2 - package 'gains':
# one group per record, so the curve is traced case by case.

library(gains)
df <- read.csv("liftExample.csv")
gain <- gains(df$actual, df$prob, groups = nrow(df))

# cumulative response against number of cases, starting from the origin
plot(
  x = c(0, gain$cume.obs),
  y = c(0, gain$cume.pct.of.total * sum(df$actual)),
  xlab = "# cases", ylab = "Cumulative", type = "l"
)

# reference line from the origin to (number of cases, total of `actual`)
lines(
  x = c(0, nrow(df)),
  y = c(0, sum(df$actual)),
  col = "gray", lty = 2
)

#### Figure 5.7

# gains() with its default grouping supplies the per-group statistics used
# below; with the caret package the groups would have to be computed by hand.

gain <- gains(df$actual, df$prob)

# bar height = mean response in the group divided by the overall mean of
# `actual`; bars are labelled with the group depth
barplot(
  height = gain$mean.resp / mean(df$actual),
  names.arg = gain$depth,
  xlab = "Percentile",
  ylab = "Mean Response",
  main = "Decile-wise lift chart"
)

Вам также может понравиться

Problem: # Partition
Документ5 страниц
Problem: # Partition
pavan adapala
Оценок пока нет
Why Good Matters Governance: Relevant Business Knowledge
Документ78 страниц
Why Good Matters Governance: Relevant Business Knowledge
prameyak1
100% (1)
Concept Based Practice Questions for Tableau Desktop Specialist Certification Latest Edition 2023
От Everand
Concept Based Practice Questions for Tableau Desktop Specialist Certification Latest Edition 2023
Exam OG
Оценок пока нет
ForecastMETHODS TECHNIQUES
Документ116 страниц
ForecastMETHODS TECHNIQUES
Venkata Nelluri Pmp
100% (1)
Anlyse Mine UnstructeredData@SocialMedia
Документ80 страниц
Anlyse Mine UnstructeredData@SocialMedia
Venkata Nelluri Pmp
100% (1)
BookSlides 5B Similarity Based Learning
Документ69 страниц
BookSlides 5B Similarity Based Learning
Mba Nani
Оценок пока нет
Supply Chain Execution Predictive Analytics Second Edition
От Everand
Supply Chain Execution Predictive Analytics Second Edition
Gerardus Blokdyk
Оценок пока нет
AI Testing A Complete Guide - 2021 Edition
От Everand
AI Testing A Complete Guide - 2021 Edition
Gerardus Blokdyk
Оценок пока нет
Price optimization A Clear and Concise Reference
От Everand
Price optimization A Clear and Concise Reference
Gerardus Blokdyk
Оценок пока нет
Sales Predictive Analytics Standard Requirements
От Everand
Sales Predictive Analytics Standard Requirements
Gerardus Blokdyk
Оценок пока нет
Chapter 14 - Cluster Analysis: Data Mining For Business Intelligence
Документ31 страница
Chapter 14 - Cluster Analysis: Data Mining For Business Intelligence
jay
Оценок пока нет
Pro Power BI Theme Creation: JSON Stylesheets for Automated Dashboard Formatting
От Everand
Pro Power BI Theme Creation: JSON Stylesheets for Automated Dashboard Formatting
Adam Aspin
Оценок пока нет
Making Sense of Data I: A Practical Guide to Exploratory Data Analysis and Data Mining
От Everand
Making Sense of Data I: A Practical Guide to Exploratory Data Analysis and Data Mining
Glenn J. Myatt
Оценок пока нет
Salary Prediction LinearRegression
Документ7 страниц
Salary Prediction LinearRegression
Yagnesh Vyas
100% (1)
Single customer view Second Edition
От Everand
Single customer view Second Edition
Gerardus Blokdyk
Оценок пока нет
Spark SQL A Complete Guide
От Everand
Spark SQL A Complete Guide
Gerardus Blokdyk
Оценок пока нет
Assignment 3
Документ5 страниц
Assignment 3
Ben Belanger
Оценок пока нет
Two-Tier ERP Strategy A Clear and Concise Reference
От Everand
Two-Tier ERP Strategy A Clear and Concise Reference
Gerardus Blokdyk
Оценок пока нет
Linear Regression PDF
Документ16 страниц
Linear Regression PDF
api-540582672
100% (1)
Mastering Parallel Programming with R
От Everand
Mastering Parallel Programming with R
Simon R. Chapple
Оценок пока нет
Data Catalog Third Edition
От Everand
Data Catalog Third Edition
Gerardus Blokdyk
Оценок пока нет
Solutions Manual to Accompany Introduction to Quantitative Methods in Business: with Applications Using Microsoft Office Excel
От Everand
Solutions Manual to Accompany Introduction to Quantitative Methods in Business: with Applications Using Microsoft Office Excel
Bharat Kolluri
Оценок пока нет
Analysis of variance Third Edition
От Everand
Analysis of variance Third Edition
Gerardus Blokdyk
Оценок пока нет
Customer Data and Analysis Second Edition
От Everand
Customer Data and Analysis Second Edition
Gerardus Blokdyk
Оценок пока нет
Getting Started with Dynamics NAV 2013 Application Development
От Everand
Getting Started with Dynamics NAV 2013 Application Development
Alex Chow
Оценок пока нет
(Excerpts From) Investigating Performance: Design and Outcomes With Xapi
От Everand
(Excerpts From) Investigating Performance: Design and Outcomes With Xapi
Janet Laane Effron
Оценок пока нет
Workforce Analysis A Complete Guide - 2020 Edition
От Everand
Workforce Analysis A Complete Guide - 2020 Edition
Gerardus Blokdyk
Оценок пока нет
Advanced Analytics for Government The Ultimate Step-By-Step Guide
От Everand
Advanced Analytics for Government The Ultimate Step-By-Step Guide
Gerardus Blokdyk
Оценок пока нет
Data Preparation
Документ87 страниц
Data Preparation
jessie nando
100% (1)
Program Data Mining With Business Analytics PDF
Документ5 страниц
Program Data Mining With Business Analytics PDF
Antonio Alvarez
Оценок пока нет
Data Visualization: Tutorial Dr. John F. Tripp
Документ51 страница
Data Visualization: Tutorial Dr. John F. Tripp
preeti agarwal
Оценок пока нет
Cell2Cell Data Documentation
Документ2 страницы
Cell2Cell Data Documentation
Jayesh Patil
Оценок пока нет
Introduction To AI IBM (COURSERA)
Документ2 страницы
Introduction To AI IBM (COURSERA)
Ritika Mondal
Оценок пока нет
Data curation The Ultimate Step-By-Step Guide
От Everand
Data curation The Ultimate Step-By-Step Guide
Gerardus Blokdyk
Оценок пока нет
Data Governance and Data Management: Contextualizing Data Governance Drivers, Technologies, and Tools
От Everand
Data Governance and Data Management: Contextualizing Data Governance Drivers, Technologies, and Tools
Rupa Mahanti
Оценок пока нет
exploratory data analysis A Complete Guide - 2019 Edition
От Everand
exploratory data analysis A Complete Guide - 2019 Edition
Gerardus Blokdyk
Оценок пока нет
A Comparative Study of Classification Methods in Data Mining Using RapidMiner Studio
Документ6 страниц
A Comparative Study of Classification Methods in Data Mining Using RapidMiner Studio
mishranamit2211
100% (1)
Final Reduced Objective Allowable Allowable Cell Name Value Cost Coefficient Increase Decrease
Документ7 страниц
Final Reduced Objective Allowable Allowable Cell Name Value Cost Coefficient Increase Decrease
Deepanshu Raj
Оценок пока нет
MSTC Final Exam 2017
Документ13 страниц
MSTC Final Exam 2017
Elis Komariah
Оценок пока нет
Gradient Descent - Linear Regression
Документ47 страниц
Gradient Descent - Linear Regression
Raushan Kashyap
100% (1)
Introduction to Machine Learning in the Cloud with Python: Concepts and Practices
От Everand
Introduction to Machine Learning in the Cloud with Python: Concepts and Practices
Pramod Gupta
Оценок пока нет
My SQL For Beginners
Документ3 страницы
My SQL For Beginners
Pallavi Singh
Оценок пока нет
Data Marts A Complete Guide - 2021 Edition
От Everand
Data Marts A Complete Guide - 2021 Edition
Gerardus Blokdyk
Оценок пока нет
Web Developer A Complete Guide - 2019 Edition
От Everand
Web Developer A Complete Guide - 2019 Edition
Gerardus Blokdyk
Оценок пока нет
MDM of Product Data Solutions Second Edition
От Everand
MDM of Product Data Solutions Second Edition
Gerardus Blokdyk
Оценок пока нет
Analysing Ad Budget
Документ4 страницы
Analysing Ad Budget
Srikanth
100% (1)
Operations Research
Документ35 страниц
Operations Research
Fida Al Hasan
Оценок пока нет
QWE Case Study
Документ5 страниц
QWE Case Study
Shubhendra vatsa
Оценок пока нет
2 Forecast Accuracy
Документ26 страниц
2 Forecast Accuracy
natalie clyde mates
Оценок пока нет
Machine Learning Hands-On Programs Program 1: Linear Regression - Single Variable Linear Regression
Документ22 страницы
Machine Learning Hands-On Programs Program 1: Linear Regression - Single Variable Linear Regression
KANTESH kantesh
100% (1)
Data Mining
Документ33 страницы
Data Mining
muluken
Оценок пока нет
Week 3 Teradata Exercise Guide: Managing Big Data With Mysql Dr. Jana Schaich Borg, Duke University
Документ6 страниц
Week 3 Teradata Exercise Guide: Managing Big Data With Mysql Dr. Jana Schaich Borg, Duke University
Nuts
Оценок пока нет
DDM HW1 Akash Srivastava
Документ14 страниц
DDM HW1 Akash Srivastava
Akash Srivastava
100% (2)
Data Visualization Strategy Standard Requirements
От Everand
Data Visualization Strategy Standard Requirements
Gerardus Blokdyk
Оценок пока нет
Data Preparation Process PDF
Документ30 страниц
Data Preparation Process PDF
Irfan Zubair
Оценок пока нет
Graph Analytics A Clear and Concise Reference
От Everand
Graph Analytics A Clear and Concise Reference
Gerardus Blokdyk
Оценок пока нет
MTCARS Regression Analysis
Документ5 страниц
MTCARS Regression Analysis
Erick Costa de Farias
Оценок пока нет
Credit EDA Assignment PDF
Документ40 страниц
Credit EDA Assignment PDF
Alisha Anand
Оценок пока нет
L03B-Dimensional Modeling II
Документ36 страниц
L03B-Dimensional Modeling II
Frans Sitohang
Оценок пока нет
Group Assignment - Data Mining
Документ28 страниц
Group Assignment - Data Mining
Simran Saha
Оценок пока нет
Sole Toolkit (Self Organised Learning Environment)
Документ25 страниц
Sole Toolkit (Self Organised Learning Environment)
Philip Finlay Bryan
Оценок пока нет
Sole Toolkit (Self Organised Learning Environment)
Документ25 страниц
Sole Toolkit (Self Organised Learning Environment)
Philip Finlay Bryan
Оценок пока нет
Sole Toolkit (Self Organised Learning Environment)
Документ25 страниц
Sole Toolkit (Self Organised Learning Environment)
Philip Finlay Bryan
Оценок пока нет
This Is The Final
Документ1 страница
This Is The Final
Anonymous
Оценок пока нет
BookletOF THEB SBBDUSNND
Документ4 страницы
BookletOF THEB SBBDUSNND
Anonymous
Оценок пока нет
Ansia I Haz 102005 Analysis
Документ99 страниц
Ansia I Haz 102005 Analysis
Anonymous
Оценок пока нет
Business Continuity Planning
Документ56 страниц
Business Continuity Planning
Anonymous
Оценок пока нет
Maina, Eunice W - The Effects of Peer Pressure A Case Study of The Public Service, Nairobi County PDF
Документ70 страниц
Maina, Eunice W - The Effects of Peer Pressure A Case Study of The Public Service, Nairobi County PDF
Anonymous
Оценок пока нет
Misanya, Sophy M - Peer Influence On Academic Performance of Form One Students in Girls Boarding Secondary Schools in Kanduyi Constituency Kenya PDF
Документ118 страниц
Misanya, Sophy M - Peer Influence On Academic Performance of Form One Students in Girls Boarding Secondary Schools in Kanduyi Constituency Kenya PDF
Anonymous
Оценок пока нет
Above Security Cantoe Robert Potvin
Документ36 страниц
Above Security Cantoe Robert Potvin
Anonymous
Оценок пока нет
A Study On The Effects of Music To The Academic Performance of The Students in Amacc-Caloocan
Документ17 страниц
A Study On The Effects of Music To The Academic Performance of The Students in Amacc-Caloocan
Anonymous
Оценок пока нет
Cat 24M
Документ24 страницы
Cat 24M
Marcelo Cardozo
Оценок пока нет
Peer Pressure
Документ11 страниц
Peer Pressure
Elisha_moxybee_8751
Оценок пока нет
29
Документ12 страниц
29
Nordiyana Yusof
Оценок пока нет
Kimley Horn
Документ6 страниц
Kimley Horn
Anonymous
Оценок пока нет
PIIT Starter Cal Portrait
Документ1 страница
PIIT Starter Cal Portrait
Hà Phương
Оценок пока нет
Lecture 7 - CH 3 Forecasting - 1spp
Документ58 страниц
Lecture 7 - CH 3 Forecasting - 1spp
satyavani
Оценок пока нет
Data Analysis and Interpretation
Документ83 страницы
Data Analysis and Interpretation
Mhmd Habbosh
Оценок пока нет
Homework Assignment Meeting 5
Документ10 страниц
Homework Assignment Meeting 5
Marwah Fazli
Оценок пока нет
Jal Basis Info Und Analysis
Документ194 страницы
Jal Basis Info Und Analysis
Erhanbaba
Оценок пока нет
Lecture 2 S1 - AY2022.23 - Cost Behaviors, Drivers and Estimation - Student
Документ44 страницы
Lecture 2 S1 - AY2022.23 - Cost Behaviors, Drivers and Estimation - Student
Gautham Pushpanathan
Оценок пока нет
Girish Chadha - 29th December 2022
Документ35 страниц
Girish Chadha - 29th December 2022
Girish Chadha
100% (3)
109 Data Science Interview Questions and Answers - Springboard Blog
Документ11 страниц
109 Data Science Interview Questions and Answers - Springboard Blog
Samarveer Singh
100% (1)
Anomaly Prediction in Mobile Networks: A Data Driven Approach For Machine Learning Algorithm Selection
Документ7 страниц
Anomaly Prediction in Mobile Networks: A Data Driven Approach For Machine Learning Algorithm Selection
Lanceloth01
Оценок пока нет
Simultaneous Equations Models
Документ30 страниц
Simultaneous Equations Models
NISHANT
Оценок пока нет
Regression Problems in Python PDF
Документ34 страницы
Regression Problems in Python PDF
mathew
Оценок пока нет
CH 09
Документ172 страницы
CH 09
Erkan
Оценок пока нет
Appendix E - The Linear Regression Model in Matrix Form
Документ14 страниц
Appendix E - The Linear Regression Model in Matrix Form
Islani Abdessamad
Оценок пока нет
Statistics For Management (BBA-303) : Introduction - 1
Документ10 страниц
Statistics For Management (BBA-303) : Introduction - 1
sendreceivemails7803
Оценок пока нет
Measures of Correlation Module
Документ24 страницы
Measures of Correlation Module
Meynard Magsino
Оценок пока нет
Chapter 5
Документ16 страниц
Chapter 5
Edward
Оценок пока нет
Review of Multiple Regression: Assumptions About Prior Knowledge. This Handout Attempts To Summarize and Synthesize
Документ12 страниц
Review of Multiple Regression: Assumptions About Prior Knowledge. This Handout Attempts To Summarize and Synthesize
Kiran Poudel
Оценок пока нет
McCullough, Tsang & Brion 2003 Personality Traits in Adolescence As Predictors of Religiousness in Early Adulthood - Findings From The Terman Longitudinal Study
Документ13 страниц
McCullough, Tsang & Brion 2003 Personality Traits in Adolescence As Predictors of Religiousness in Early Adulthood - Findings From The Terman Longitudinal Study
hoorie
Оценок пока нет
Quality of Analytical Measurements: Univariate Regression: 2009 Elsevier B.V. All Rights Reserved
Документ43 страницы
Quality of Analytical Measurements: Univariate Regression: 2009 Elsevier B.V. All Rights Reserved
Calidad Lass
Оценок пока нет
Influence of Factors in Green Advertising Upon Purchase Intentions-A Study of Pakistani University Students
Документ8 страниц
Influence of Factors in Green Advertising Upon Purchase Intentions-A Study of Pakistani University Students
sajjad ali khan
Оценок пока нет
The Sage Encyclopedia of Social Science Research Methods
Документ9 страниц
The Sage Encyclopedia of Social Science Research Methods
andy1andy0
Оценок пока нет
Effect of Service Quality On Customer Loyalty: A Study of Hotels in Ethiopia
Документ10 страниц
Effect of Service Quality On Customer Loyalty: A Study of Hotels in Ethiopia
IAEME Publication
Оценок пока нет
Age As A Risk Factor For Burnout Syndrome in Nursing Professionals. A Meta-Analysis
Документ12 страниц
Age As A Risk Factor For Burnout Syndrome in Nursing Professionals. A Meta-Analysis
maria blanca cuenca
Оценок пока нет
Linear Regression: Jia-Bin Huang Virginia Tech
Документ59 страниц
Linear Regression: Jia-Bin Huang Virginia Tech
Mr. Raghunath Reddy
Оценок пока нет
Neema Thesis Vfinal
Документ58 страниц
Neema Thesis Vfinal
Christian Vermehren
Оценок пока нет
Bi-Variate Linear Regression Analysis
Документ15 страниц
Bi-Variate Linear Regression Analysis
26 USAID JAMEEL NAZIR
Оценок пока нет
Machine Learning Cheat Sheet ??? - ?
Документ231 страница
Machine Learning Cheat Sheet ??? - ?
Mahesh Gulla
Оценок пока нет
7th Gcbss - Proceeding - Full Papers
Документ189 страниц
7th Gcbss - Proceeding - Full Papers
Lemlit Unirow Tuban
100% (1)
Focus Questions For Laura Martin
Документ10 страниц
Focus Questions For Laura Martin
Eyiram Adanu
100% (2)
Gujarat Technological University
Документ8 страниц
Gujarat Technological University
patel
Оценок пока нет
M. Amir Hossain PHD: Course No: Emba 502: Business Mathematics and Statistics
Документ31 страница
M. Amir Hossain PHD: Course No: Emba 502: Business Mathematics and Statistics
SP Vet
Оценок пока нет