-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathscatter.R
executable file
·76 lines (58 loc) · 2.59 KB
/
scatter.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
#!/usr/bin/env Rscript
library(ggplot2)
places = c(
"bayarea",
"manchester",
"seattle",
"vancouver",
"haiti",
"london",
"amsterdam",
"cairo",
"tirana"
)
scales = c(
"250m",
"500m",
"1000m"
)
# Loop over each possible tsv filename exported from Python script:
for (place in places) {
for (scale in scales) {
inputfile = paste0('/Users/alan/github/mapgardening/outputv4_', place, '_raster_', scale, '.tsv')
# If filename doesn't exist, skip it
if (!file.exists(inputfile)) {
cat("skipping", inputfile, "\n")
next
}
cat("reading", place, "from file", inputfile, "\n")
classes <- c("numeric", "character", "numeric", "numeric", "numeric", "Date", "Date", "Date", "numeric", "Date", "Date")
# specify quote and comment.char to avoid catching "#" or "'"
frame <- read.table(inputfile, sep="\t", quote="", comment.char="", header=TRUE, na.strings = "NULL", colClasses=classes)
names(frame) = c("uid", "username", "edits", "blankedits", "v1edits", "firstedit", "firsteditv1", "firsteditblank", "days_active", "mean_date", "mean_date_weighted")
attach(frame)
outputfile = paste0('/Users/alan/github/mapgardening/outscattersingle4_total-v-blank_', place, '_', scale, '.png')
#pdf(outputfile, 7, 7) # Create a PDF of 7 by 7 inches
png(outputfile, 600, 600)
# Add 0.1 to x and y to avoid problems with the log scale
a <- ggplot(data = frame, aes(x = jitter(edits+0.1, 0.01), y = jitter(blankedits+0.1, 0.01), col=days_active)) +
#stat_smooth(formula="y ~ x", na.rm=TRUE, method="lm") +
#stat_smooth(formula="y ~ poly(x,2)", na.rm=TRUE, method="lm") +
#stat_smooth(formula="y ~ a * log(x+0.1) + b", na.rm=TRUE, method="lm") +
#stat_smooth(formula="y ~ a * exp(b *x)", na.rm=TRUE, method="lm") +
geom_point(aes(size = days_active)) +
scale_x_log10("Log total edits") + scale_y_log10("Log blankspot edits") +
ggtitle(paste0(place, '_', scale)) + scale_color_continuous(name = "days active")
print(a)
dev.off()
outputfile = paste0('/Users/alan/github/mapgardening/output_meaneditdate_', place, '_', scale, '.png')
png(outputfile, 600, 600)
# Add 0.1 to x and y to avoid problems with the log scale
a <- ggplot(data = frame, aes(x = mean_date_weighted, y = jitter(blankedits+0.1, 0.01), col=days_active)) +
geom_point(aes(size = days_active)) +
scale_x_date("Mean edit date weighted") + scale_y_log10("Log blankspot edits") +
ggtitle(paste0(place, '_', scale)) + scale_color_continuous(name = "days active")
print(a)
dev.off()
detach(frame)
}