# Rproject10_flow_occ_regressions.r
# 1.0 Read in data ----
# See Problem 10.9.50,
# data from: http://pems.eecs.berkeley.edu
# For each of three lanes, the
# flow (number of cars)
# occupancy (percentage of time a car was over the loop)
#
# 1740 5-minute intervals
# Lane 1 farthest left lane, lane 2 center, lane 3 farthest right
# Read the comma-separated flow/occupancy table (header row present); character
# columns are kept as character rather than converted to factors.
flowocc <- read.table(
  file = "Rice 3e Datasets/ASCII Comma/Chapter 10/flow-occ.txt",
  sep = ",",
  stringsAsFactors = FALSE,
  header = TRUE
)

# Parse the Timestamp text (month/day/year hour:minute:second). No time zone is
# given, so strptime() interprets the values in the session's local time zone.
Timestamp2 <- strptime(flowocc$Timestamp, "%m/%d/%Y %H:%M:%S")
#plot(Timestamp2, flowocc$Lane.1.Occ)
#plot(flowocc$Lane.1.Occ)
# NOTE(review): strptime() returns POSIXlt, so this stores a POSIXlt column in
# the data frame. as.POSIXct(Timestamp2) is usually the safer column type --
# confirm nothing later relies on POSIXlt fields before changing it.
flowocc$Timestamp <- Timestamp2

# Simple linear regression of Lane 3 occupancy on Lane 1 occupancy using every
# row. The model is fitted once and reused for the line overlay and for the
# residual diagnostics that follow.
lmfit1 <- lm(Lane.3.Occ ~ Lane.1.Occ, data = flowocc)
plot(flowocc$Lane.1.Occ, flowocc$Lane.3.Occ)
abline(lmfit1, col = "green")
# Figure (output of the plot call above): s3://crabby-images/a9cc9/a9cc902cb125abbbda0b7aa75bac65d0321744a6
# Residuals of the all-data fit plotted against the predictor, with a gray
# horizontal reference line at zero.
plot(
  x = flowocc$Lane.1.Occ,
  y = lmfit1$residuals
)
abline(h = 0, col = "gray")
# Figure (output of the plot call above): s3://crabby-images/a28ca/a28ca78b735bb36695aa5ae837420243b9837493
# Normal Q-Q plot of the residuals from the all-data fit.
qqnorm(y = lmfit1[["residuals"]])
# Figure (output of the qqnorm call above): s3://crabby-images/dbed9/dbed94afd31e1354f8a03ab371295539e0ae58ff
# Consider two subsets
# Logical row masks that split the data at a Lane 1 occupancy of 0.18.
# Both comparisons are strict, so a row whose Lane.1.Occ is exactly 0.18
# belongs to neither subset.
ind.subset1 <- flowocc$Lane.1.Occ < 0.18
ind.subset2 <- flowocc$Lane.1.Occ > 0.18
# For first subset:
plot(flowocc$Lane.1.Occ[ind.subset1], flowocc$Lane.3.Occ[ind.subset1])
# The subset is selected with 0/1 weights rather than `subset =`: rows with
# weight 0 do not influence the fitted line, but the fit still carries one
# residual per row of flowocc, so the residuals can later be indexed with
# ind.subset1. The argument is spelled `weights` in full instead of relying on
# partial matching of `weight`.
lmfit1.subset1 <- lm(
  Lane.3.Occ ~ Lane.1.Occ,
  data = flowocc,
  weights = 1 * ind.subset1
)
abline(lmfit1.subset1, col = "green")
# Figure (output of the plot call above): s3://crabby-images/0b90a/0b90a48da420d70f44351c4fa75aa063a1bc9ca6
# Residuals of the first-subset fit against the predictor, restricted to the
# rows in that subset, with a gray horizontal reference line at zero.
plot(
  x = flowocc$Lane.1.Occ[ind.subset1],
  y = lmfit1.subset1$residuals[ind.subset1]
)
abline(h = 0, col = "gray")
# Figure (output of the plot call above): s3://crabby-images/76617/76617c1e135bda0beb341b3e897fdcb534771f8f
# Normal Q-Q plot of the first-subset fit's residuals, subset rows only.
qqnorm(y = lmfit1.subset1[["residuals"]][ind.subset1])
# Figure (output of the qqnorm call above): s3://crabby-images/f0339/f0339e3b2c70dd819f49bd585c9e20ffb59de50b
# For second subset:
# Scatter plot of Lane 3 vs. Lane 1 occupancy for the rows flagged by
# ind.subset2, with the line fitted to those rows overlaid in green.
plot(flowocc$Lane.1.Occ[ind.subset2], flowocc$Lane.3.Occ[ind.subset2])
# The subset is selected with 0/1 weights rather than `subset =`: rows with
# weight 0 do not influence the fitted line, but the fit still carries one
# residual per row of flowocc, so the residuals can later be indexed with
# ind.subset2. The argument is spelled `weights` in full instead of relying on
# partial matching of `weight`.
lmfit1.subset2 <- lm(
  Lane.3.Occ ~ Lane.1.Occ,
  data = flowocc,
  weights = 1 * ind.subset2
)
abline(lmfit1.subset2, col = "green")
# Figure (output of the plot call above): s3://crabby-images/dbb0c/dbb0cdcd840b78a4c781ab0cab495b3afa8d9869
# Residuals of the second-subset fit against the predictor, restricted to the
# rows in that subset, with a gray horizontal reference line at zero.
plot(
  x = flowocc$Lane.1.Occ[ind.subset2],
  y = lmfit1.subset2$residuals[ind.subset2]
)
abline(h = 0, col = "gray")
# Figure (output of the plot call above): s3://crabby-images/c08ae/c08aeb963ad94ae30561c6e62f03bf00bf8d79ec
# Normal Q-Q plot of the second-subset fit's residuals, subset rows only.
qqnorm(y = lmfit1.subset2[["residuals"]][ind.subset2])
# Figure (output of the qqnorm call above): s3://crabby-images/95069/950695efc0d4394b72f966eedb6746908c5f627a
# For second subset: