Professional Documents
Culture Documents
EXPT NO: 9
DATE:30/09/2022
REG. NO.:20BEC1351
AIM
R PROGRAM
# Experiment 9 script: loads Credit.csv and attaches ggplot2, dplyr and
# reshape2. NOTE(review): this listing appears incomplete -- `cmatrix` and
# `cmatrix_melted` are printed below but never assigned in the visible code.

# Removes every object from the global environment before starting.
rm(list=ls())
# Read the credit data set from a hard-coded absolute Windows path.
data <-read.csv("C:\\Users\\dsp\\Desktop\\20be1351\\Credit.csv")
# Auto-print the whole data frame.
data
# install.packages("ggplot2")
library("ggplot2")
library(dplyr)
# Prints `cmatrix`. No assignment to it is visible, so this line fails with
# "object 'cmatrix' not found" unless it is defined elsewhere.
# NOTE(review): presumably a correlation matrix of the numeric columns -- the
# defining line seems to have been lost; confirm against the original script.
cmatrix
# install.packages("reshape2")
library(reshape2)
# Prints `cmatrix_melted`, which is likewise never assigned in this listing.
# NOTE(review): presumably the result of reshape2::melt(cmatrix) -- confirm.
cmatrix_melted
OUTPUT
CSE3505 – FOUNDATIONS OF DATA ANALYTICS
EXPT NO: 10
DATE:07/10/2022
LINEAR REGRESSION
AIM
R PROGRAM
# Experiment 10: simple linear regression of insurance charges on BMI.
#
# The workspace is deliberately not wiped with rm(list = ls()): that call
# silently destroys unrelated objects in the caller's session and does not
# reset loaded packages or options anyway.

# Read the insurance data set from a hard-coded absolute Windows path.
data <- read.csv("C:\\Users\\dsp\\Desktop\\20be1351\\insurance.csv")
# Explicit print() so the output also appears when the file is source()d.
print(data)

# Predictor and response kept as plain vectors for the scatter plot below.
x <- data$bmi
y <- data$charges

# regression
# Fit on the data frame columns so the coefficient is labelled `bmi` and
# predict() can match new observations by column name.
reg <- lm(charges ~ bmi, data = data)
print(reg)
print(summary(reg))

# plotting
# Scatter plot of charges against BMI with the fitted line overlaid.
plot(x, y)
abline(reg)

# Predicted charges for a single new observation with bmi = 30.
a <- data.frame(bmi = 30)
print(predict(reg, newdata = a))
OUTPUT
CSE3505 – FOUNDATIONS OF DATA ANALYTICS
EXPT NO: 11
DATE:21/10/2022
REG. NO.:20BEC1351
AIM
R PROGRAM
# Experiment 11: correlation, simple and multiple linear regression with
# residual diagnostics on the columns Cdur, Camt and age.
#
# The original listing wiped the workspace with rm(list = ls()) and then
# immediately used `data` and `slr`, neither of which it defined, so it could
# not run. The wipe is removed and the missing pieces are reconstructed below.

library(ggplot2)

# NOTE(review): the file to load was not shown in the original listing. The
# path is assumed to be the Credit.csv used by the earlier experiment, whose
# columns are queried as cdur/camt/age elsewhere in this document -- confirm.
data <- read.csv("C:\\Users\\dsp\\Desktop\\20be1351\\Credit.csv")

# Scatter plot and correlation test between the two variables.
print(ggplot(data, aes(x = Cdur, y = Camt)) + geom_point())
print(cor.test(data$Cdur, data$Camt))

# NOTE(review): `slr` was used but never assigned in the original listing.
# Reconstructed as the one-predictor counterpart of `mlr` below -- confirm.
slr <- lm(Cdur ~ Camt, data = data)
# qqline() only adds a reference line to an existing plot, so the normal Q-Q
# plot has to be drawn with qqnorm() first.
qqnorm(residuals(slr))
qqline(residuals(slr))
# Built-in normal Q-Q diagnostic plot for the fitted model.
plot(slr, which = 2)

# Multiple regression: Cdur explained by Camt and age.
mlr <- lm(Cdur ~ Camt + age, data = data)
print(summary(mlr))
# Residuals against observation index; residuals() avoids relying on partial
# matching of `$resid` to `$residuals`.
plot(residuals(mlr))
# Draw the Q-Q plot before adding its reference line; the original added the
# line on top of the index plot above, where it has no meaning.
qqnorm(residuals(mlr))
qqline(residuals(mlr))
plot(mlr, which = 2)
OUTPUT
CSE3505 – FOUNDATIONS OF DATA ANALYTICS
EXPT NO: 12
DATE:04/11/2022
REG. NO.:20BEC1351
R PROGRAM
# Experiment 12: querying a data frame with SQL through sqldf.
#
# The workspace is deliberately not wiped with rm(list = ls()): that call
# silently destroys unrelated objects in the caller's session.

library(dplyr)
# install.packages("sqldf")
library(sqldf)

# Read the credit data set from a hard-coded absolute Windows path.
data_a <- read.csv("C:\\Users\\asmih\\Desktop\\R prog\\Credit.csv")

# Work on a random sample of 100 rows. No seed is set, so the sample (and
# every result below) differs from run to run.
data_credit <- sample_n(data_a, 100)

df1 <- sqldf("Select * from data_credit") # Select all columns
df2 <- sqldf("select camt from data_credit") # Select one column
# Double quotes are correct here: "age" is a quoted identifier (column name).
df3 <- sqldf('select "age" from data_credit') # Select one column
df4 <- sqldf("select * from data_credit LIMIT 5") # Head
df5 <- sqldf("select * from data_credit ORDER BY cdur desc") # Sorting
df6 <- sqldf("select age from data_credit WHERE age > 30") # Filtering
# Filtering - excludes the two listed values (a set, not a range).
df7 <- sqldf("select cdur from data_credit WHERE cdur not in (11,13)")
# Filtering - category. SQL string literals take single quotes; a
# double-quoted token is parsed as an identifier first and only falls back to
# a string when no such column exists.
df8 <- sqldf("select * from data_credit WHERE prop LIKE 'real estate'")
# Grouped aggregate: mean cdur and camt per age, for ages above 30.
# NOTE(review): the alias `avg_cmt` looks like a typo for `avg_camt`; it is
# kept unchanged so the output column name stays the same.
df9 <- sqldf(paste(
  "select avg(cdur) as avg_cdur, avg(camt) as avg_cmt, age",
  "from data_credit WHERE age > 30 GROUP BY age"
))
OUTPUT