-
Notifications
You must be signed in to change notification settings - Fork 0
/
Multiple regresison: R.r
53 lines (40 loc) · 1.65 KB
/
Multiple regresison: R.r
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
#importing Dataset
dataset<-read.csv('50_Startups.csv')
#encode categorical data
dataset$State<-factor(dataset$State,
levels = c('New York','California', 'Florida'),
labels = c(1,2,3))
#spliting dataset into train and test
library(caTools)
set.seed(123)
split = sample.split(dataset$Profit,SplitRatio = 0.8)
training_set = subset(dataset, split == 'TRUE')
test_set = subset(dataset, split == 'FALSE')
#Fitting Multiple Linear regression to training set
#regressor = lm(formula = Profit ~ ., data =training_set)
#regressor = lm(formula = Profit ~ R.D.Spend + Administration + Marketing.Spend + State, data = training_set)
regressor = lm(formula = Profit ~ R.D.Spend, data = training_set)
summary(regressor)
#Predicting the test results
y_pred = predict(regressor, newdata = test_set)
#Building the optimal model using backword elimination
regressor = lm(formula = Profit ~ R.D.Spend + Administration + Marketing.Spend + State, data = training_set)
summary(regressor)
##Removing state2
regressor = lm(formula = Profit ~ R.D.Spend+Administration+Marketing.Spend+
factor(State ,exclude=c(2)),
data = training_set)
summary(regressor)
#removing state
regressor = lm(formula = Profit ~ R.D.Spend+Administration+Marketing.Spend,
data = training_set)
summary(regressor)
#removing Administration
regressor = lm(formula = Profit ~ R.D.Spend+Marketing.Spend,
data = training_set)
summary(regressor)
#removing Marketing.spend
regressor = lm(formula = Profit ~ R.D.Spend,
data = training_set)
summary(regressor)
y_pred = predict(regressor, newdata=test_set)