-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathquiz2.R
65 lines (55 loc) · 2.34 KB
/
quiz2.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# question 2
# Read the first 150 lines of the page and report the number of characters
# in lines 2, 45 and 122.
con <- url('http://simplystatistics.tumblr.com/', open = 'r')
# Close the connection even if the read fails, so it is never left open.
simplyStats <- tryCatch(readLines(con, n = 150), finally = close(con))
nchar(simplyStats)[c(2, 45, 122)]
# question 3
# Download the housing CSV into the working directory, load it, and count the
# rows whose VAL column equals 24.
fileUrl <- "https://dl.dropbox.com/u/7710864/data/csv_hid/ss06hid.csv"
download.file(url = fileUrl, destfile = "./housingData.csv", method = "curl")
housingData <- read.csv(file = "housingData.csv")
# Summing the logical mask counts the TRUE entries; NA comparisons are skipped.
sum(housingData$VAL == 24, na.rm = TRUE)
# question 5
# Count the rows matching each of three BDS / RMS value pairs.
# Summing a logical mask counts its TRUE entries; NA comparisons are skipped.
sum(housingData$BDS == 3 & housingData$RMS == 4, na.rm = TRUE)
sum(housingData$BDS == 2 & housingData$RMS == 5, na.rm = TRUE)
sum(housingData$BDS == 2 & housingData$RMS == 7, na.rm = TRUE)
# question 6
# Flag the rows where ACR is 3 and AGS is 6, then preview the first three
# matching rows, showing only the first two variables (columns).
agricultureLogical <- (housingData$ACR == 3) & (housingData$AGS == 6)
housingData[head(which(agricultureLogical), n = 3), 1:2]
# question 7
# Subset the housing data to the rows where ACR is 3 and AGS is 6, then count
# the missing MRGX values in that subset.
agricultureLogical <- (housingData$ACR == 3) & (housingData$AGS == 6)
# which() drops NA comparisons, leaving only the positions that are TRUE.
indexes <- which(agricultureLogical)
subsetDataFrame <- housingData[indexes, ]
sum(is.na(subsetDataFrame[["MRGX"]]))
# question 8
# Split every column name on the string "wgtp" and show the pieces obtained
# for the 123rd name.
strsplit(x = names(housingData), split = "wgtp")[123]
# question 9
# Quantiles of YBL, ignoring missing values.
quantile(housingData$YBL, na.rm = TRUE)
# wrong values: according to the code book (https://dl.dropbox.com/u/7710864/data/PUMSDataDict06.pdf) the YBL variable shouldn't have the value -1
# question 10
# Download the population CSV, load it, merge it with the housing data on
# SERIALNO, and report the dimensions of the merged data frame.
fileUrl <- 'https://dl.dropbox.com/u/7710864/data/csv_hid/ss06pid.csv'
download.file(fileUrl, destfile = "./populationData.csv", method = "curl")
populationData <- read.csv('populationData.csv')
resultDataSet <- merge(housingData, populationData, by = 'SERIALNO')
dim(resultDataSet)
# optional
# Preview the merged data, then inspect the housing rows whose YBL value is -1.
head(resultDataSet, 10)
summary(housingData$YBL)
# Logical mask of the rows with YBL == -1 (NA where YBL is missing).
i <- housingData$YBL == -1
# which() drops the NA entries so only genuine matches are selected.
housingData[which(i), ]
# Download the housing and population CSVs again under quiz2* file names and
# reload both data frames from those copies.
fileUrl <- 'https://dl.dropbox.com/u/7710864/data/csv_hid/ss06hid.csv'
download.file(fileUrl, destfile = "./quiz2.csv", method = "curl")
fileUrl <- 'https://dl.dropbox.com/u/7710864/data/csv_hid/ss06pid.csv'
download.file(fileUrl, destfile = "./quiz2_10.csv", method = "curl")
housingData <- read.csv('quiz2.csv')
populationData <- read.csv('quiz2_10.csv')
# Exploratory merges of the housing and population data.
?merge
# Merge on SERIALNO, naming the key column separately for each side.
resultDataSet <- merge(
  housingData, populationData,
  by.x = 'SERIALNO', by.y = 'SERIALNO'
)
dim(resultDataSet)
head(resultDataSet, 3)
# The same merge, written with the shared-key form.
resultDataSet <- merge(housingData, populationData, by = 'SERIALNO')
head(resultDataSet, 3)
dim(resultDataSet)
# NOTE(review): scratch arithmetic; its purpose is not evident from this file.
188 + 239
# With no `by`, merge() joins on every column name the two data frames share.
# The result is replaced by the SERIALNO merge on the next line.
resultDataSet <- merge(housingData, populationData)
resultDataSet <- merge(housingData, populationData, by = "SERIALNO")
# savehistory() is only available in interactive sessions, so guard it to keep
# the script runnable through source() or Rscript.
if (interactive()) {
  savehistory("~/workspace/R/quiz2.R")
}