box-o-sand/PracticingR/elementary-statistics/.Rhistory

368 lines
10 KiB
R
Raw Normal View History

2011-07-11 08:54:45 +00:00
library(MASS)
painters
painters$School
school = painters$School
school.freq = table(school)
school.freq
cbind(school.freq)
head(painters)
composition = painters$Composition
composition.freq = table(composition)
cbind(composition.freq)
school
school.freq
school.freq[1]
help(max)
school[,][1]
school[1,][1]
school[1][1]
school[1]
school.freq[1,]
school.freq[1]
school.freq[1][1]
school.freq[1]
help(typeof)
typeof(school.freq[1])
max(school.freq)
max(school)
max(school.freq)
school.relfreq = school.freq / nrow(painters)
school.relfreq
settings = options(digits=1)
school.relfreq
options(settings)
cbind(school.relfreq)
composition.freq
composition.relfreq = composition.freq / nrow(composition)
composition.relfreq = composition.freq / nrow(painters)
composition.relfreq
cbind(composition.relfreq)
# bar graph exercise
library(MASS)
school = painters$School
school.freq = table(school)
barplot(school.freq)
colors = c("red", "yellow", "green", "violet", "orange", "blue", "pink", "cyan")
barplot(schools.freq, col=colors)
barplot(school.freq, col=colors)
composition = painters$Composition
composition.freq = table(composition)
count.fields(composition.freq)
ncol(composition.freq)
composition.freq
nrow(composition.freq)
nrow(school.freq)
colors
barplot(composition.freq, col=colors)
q()
2011-07-11 09:35:43 +00:00
library(MASS)
school = painters$school
school
school = painters$School
school
school.freq = table(school)
pip(school.freq)
pie(school.freq)
colors = c("red", "yellow", "green", "violet", "orange", "blue", "pink", "cyan")
pie(school.freq, col=colors)
composition = painters$Composition
composition.freq = table(composition)
pip(composition.freq, col=colors)
pie(composition.freq, col=colors)
library(MASS)
school = painters$School
c_school = school == "C"
c_painters = painters[c_school,]
mean(c_painters$Composition)
pie(tapply(painters$Composition, painters$School, mean)
pie(tapply(painters$Composition, painters$School, mean))
barchart(tapply(painters$Composition, painters$School, mean))
barplot(tapply(painters$Composition, painters$School, mean))
q()
head(faithful)
duration = faithful$eruptions
range(duration)
breaks = seq(1.5, 5.5, by=0.5)
breaks
duration.cut = cut(duration, breaks, right=FALSE)
duration.freq = table(duration.cut)
duration.freq
cbind(duration.freq)
barplot(duration.freq)
nrow(faithful)
faithful$eruptions / nrow(faithful)
help(hist)
hist(faithful$eruptions)
faithful)
head(faithful)
hist(faithful$waiting)
hist(faithful)
help(barplot)
VADeaths
help(demo)
demo()
demo("graphics")
hist(faithful$waiting)
interval = faithful$waiting
interval
range(interval)
breaks = seq(43, 96, by=1)
breaks
interval.cut = cut(interval, breaks, right=FALSE)
interval.freq = table(interval.cut)
barplot(interval.freq)
breaks = seq(43, 96, by=5)
breaks
interval.cut = cut(interval, breaks, right=FALSE)
interval.freq = table(interval.cut)
barplot(interval.freq)
help(points)
points(interval.freq)
barplot(interval.freq)
hist(faithful$eruptions, right=FALSE)
duration = faithful$eruptions
hist(duration, right=FALSE)
colors = c("red", "yellow", "green", "violet", "orange", "blue", "pink", "cyan")
hist(duration, right=FALSE, col=colors, main="Old Faithful Eruptions", xlab="Duration minutes")
waiting_period = faithful$waiting
waiting_period = faithful$waiting
hist(waiting_period, right=FALSE, col=colors, main="Old Faithful Eruptions", xlab="Interval")
hist(waiting_period, right=FALSE, col=colors, main="Old Faithful Eruptions", xlab="Interval in minutes")
q()
2011-07-13 01:32:36 +00:00
duration = faithful$eruptions
breaks = seq(1.5, 5.5, by=0.5)
duration.cut = cut(duration, breaks, right=FALSE)
duration.freq = table(duration.cut)
duration.relfreq = duration.freq / nrow(faithful)
duration.relfreq
pie(duration.relfreq)
hist(duration.relfreq)
hist(duration.relfreq)
duration.freq
duration = faithful$eruptions
breaks = seq(1.5, 5.5, by=0.5)
breaks
typeof(breaks)
duration.cut = cut(duration, breaks, right=FALSE)
duration.freq = table(duration.cut)
duration.cumfreq = cumsum(duration.freq)
duration.cumfreq
hist(cbind(duration.cumfreq))
interval = faithful$waiting
help(function)
help("function")
help("function")
calc_cumfreq <- function(records)
breaks = seq(1.5, 5.5, by=0.5)
records.cut = cut(duration, breaks, right=FALSE)
records.freq = table(duration.cut)
records.cumfreq = cumsum(records.freq)
return(records)
calc_cumfreq <- function(records)
breaks = seq(1.5, 5.5, by=0.5)
records.cut = cut(records, breaks, right=FALSE)
help("function")
duration.cumfreq
interval = faithful$eruptions
breaks
breaks.cut = cut(interval, breaks, right=FALSE)
interval.freq = table(interval.cut)
interval.cumfreq = cumsum(interval.freq)
hist(interval.cumfreq)
q()
2011-07-13 01:55:11 +00:00
duration = faithful$eruptions
breaks = seq(1.5, 5.5, by=0.5)
duration.cut = cut(duration, breaks, right=FALSE)
duration.freq = table(duration.cut)
cumfreq0 = c(0, cumsum(duration.freq))
plot(breaks, cumfreq0, main="Old Faithful Eruptions", xlab="Duration minutes", ylab="Cumulative Eruptions")
lines(breaks, cumfreq0)
intervals = faithful$waiting
faithful$waiting
cbind(faithful$waiting)
faithful$waiting / nrow(faithful)
faithful$waiting / nrow(faithful$waiting)
intervals
breaks
intervals.cut = cut(breaks, intervals)
help(cut)
intervals.cut = cut(intervals, breaks)
intervals.cut
intervals.cut
intervals.freq = table(intervals.cut)
intervals.cut = cut(intervals, breaks, right=FALSE)
intervals.freq = table(intervals.cut)
cumfreq0 = c(0, cumsum(intervals.freq))
cumfreq0
intervals
intervals.cut = cut(intervals, breaks, right=FALSE)
intervals.cut
intervals.freq = table(intervals.cut)
intervals.freq
cbind(intervals.freq)
plot(breaks, cumfreq0)
intervals
cut(intervals, breaks)
cut(intervals, breaks, right=FALSE)
duration
cut(duration, breaks)
breaks = seq(0, 100, by=10)
breaks
cut(intervals, breaks)
intervals.cut = cut(intervals, breaks)
intervals.cut = cut(intervals, breaks, right=FALSE)
intervals.cut
intervals.freq = table(intervals.cut)
cumfreq0 = c(0, cumsum(intervals.freq))
cumfreq0
plot(breaks, cumfreq0)
lines(breaks, cumfreq0)
intervals
min(intervals)
max(intervals)
breaks = seq(40.0, 100.0, by=5.0)
intervals.cut = cut(intervals, breaks, right=FALSE)
intervals.cut
floor?
help(floor)
intervals.freq = table(intervals.cut)
intervals.freq
cumfreq0 = c(0, cumsum(intervals.freq))
cumfreq0
plot(breaks, cumfreq0)
lines(breaks, cumfreq0)
plot(breaks, cumfreq0, main="Old Faithful Intervals", xlab="Interval minutes", ylab="Cumulative Intervals")
lines(breaks, cumfreq0)
q()
2011-07-13 02:04:59 +00:00
duration = faithful$eruptions
breaks = seq(1.5, 5.5, by=0.5)
duration.cut = cut(duration, breaks, right=FALSE)
duration.freq = table(duration.cut)
duration.cumfreq = cumsum(duration.freq)
duration.cumrelfreq = duration.cumfreq / nrow(faithful)
duration.cumrelfreq
old = options(digits=2)
duration.cumrelfreq
options(old)
duration.cumrelfreq
cbind(duration.cumfreq, duration.cumrelfreq)
interval = faithful$waiting
min(interval)
max(interval)
ceiling(max(interval))
help(ceiling)
interval * 0.10
max(interval) * 0.1)
ceiling(max(interval) * 0.1)
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, right=FALSE)
interval_breaks
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=nrow(interval) / 10.0, right=FALSE)
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=(nrow(faithful) / 10.0), right=FALSE)
interval_breaks
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=(nrow(faithful) / 5.0), right=FALSE)
interval_breaks
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=(nrow(faithful) / 20.0), right=FALSE)
interval_breaks
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=(nrow(faithful) / 30.0), right=FALSE)
interval_breaks
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=5.0 right=FALSE)
interval_breaks = seq(floor(min(interval) * 0.1) * 10.0, ceiling(max(interval) * 0.1) * 10.0, by=5.0, right=FALSE)
interval_breaks
length(interval_breaks)
type(interval_breaks)
typeof(interval_breaks)
interval
interval.freq
interval.cut = cut(interval, interval_breaks, right=FALSE)
interval.cut
interval.freq = table(interval.cut)
interval.cumfreq = cumsum(interval.freq)
interval.cumfreq
interval.cumrelfreq = interval.cumfreq / nrow(faithful)
interval.cumrelfreq
cbind(interval.cumfreq, interval.cumrelfreq)
q()
2011-07-14 02:25:42 +00:00
c(duration.freq)
duration.freq)
duration.freq
c(0, duration.freq)
cumfreq0
cumfreq0 = c(0, cumsum(duration.freq))
cumfreq0
cumrelfreq0 = cumfreq0 / nrow(faithful)
cumrelfreq0
breaks
plot(breaks, cumrelfreq0, main="Old Faithful Eruptions", xlab="Duration minutes", ylab="Cumulative Eruptions Proportion")
lines(breaks, cumrelfreq0)
library(actuar)
help("library")
library(actuar)
help(ogive)
Fn = ogive(breaks, duration.freq)
plot(Fn, main="Old Faithful Eruptions", xlab="Duration minutes", ylab="Cumulative Relative Frequency")
library(PBSModelling)
library(PBSModeling)
library(PBSmodelling)
plotCsum(duration)
intervals
intervals.cut
interval_breaks
interval
intervals
interval.cut
interval.freq
intervalFn = ogive(breaks, interval.freq)
intervalFn = ogive(interval_breaks, interval.freq)
plot(intervalFn, main="Old Faithful Eruptions", xlab="Intervals in minutes", ylab="Cumulative Relative Frequency")
plotCsum(interval)
q()
2011-07-14 02:29:16 +00:00
duration
stem(duration)
interval
stem(interval)
interval
help(stem)
q()
2011-07-14 02:38:38 +00:00
waiting = faithful$waiting
head(cbind(duration, waiting))
plot(duration, waiting, xlab="Eruption duration", ylab="Time waited")
par()
plot(1:10, 1:10, type="n")
help("font")
??font
# the above was a brief excursion into font settings and such
abline(lm(waiting - duration))
plot(duration, waiting, xlab="Eruption duration", ylab="Time waited")
abline(lm(waiting - duration))
abline(lm(waiting ~ duration))
q()
2011-07-14 02:43:58 +00:00
mean(duration)
mean(interval)
??points
median(duration)
median(interval)
quantile(duration)
quantile(interval)
quantile(duration, c(.32, .57, .98))
quantile(interval, c(.17, .43, .67, .85))
q()
q()
2011-07-15 03:04:37 +00:00
max(duration)
min(duration)
max(interval) - min(interval)
IQR(duration)
IQR(interval)
boxplot(duration, horizontal=TRUE)
boxplot(interval, horizontal=TRUE)
q
q()
2011-07-15 11:36:50 +00:00
var(duration)
var(interval)
max(interval) - min(interval)
sd(duration)
sd(interval)
waiting
interval == waiting
cov(duration, waiting)
q()