[tor-commits] [metrics-tasks/master] Remove outdated censorship detector code (#2718).

karsten at torproject.org karsten at torproject.org
Tue Aug 9 13:59:09 UTC 2011


commit 4426cf9cfa1d8965057c3fe34184c5ce459fa390
Author: Karsten Loesing <karsten.loesing at gmx.net>
Date:   Tue Aug 9 15:52:38 2011 +0200

    Remove outdated censorship detector code (#2718).
---
 task-2718/README                |   27 --------------------
 task-2718/convert-dirreqs-sql.R |    8 ------
 task-2718/detect-censorship.R   |   52 ---------------------------------------
 3 files changed, 0 insertions(+), 87 deletions(-)

diff --git a/task-2718/README b/task-2718/README
deleted file mode 100644
index 8c60847..0000000
--- a/task-2718/README
+++ /dev/null
@@ -1,27 +0,0 @@
-Here's how you run the censorship detector prototype:
-
-  $ wget https://metrics.torproject.org/csv/direct-users.csv
-  $ R --slave -f detect-censorship.R
-
--------------------------------------------------------------------------
-
-Extracting raw directory requests from the metrics-web database:
-
-- Export dirreq_stats table from the metrics-web database via psql:
-
-  # \f ','
-  # \a
-  # \t
-  # \o dirreqs-sql.csv
-  # SELECT * FROM dirreq_stats ORDER BY statsend;
-  # \o
-  # \t
-  # \a
-
-- Transform the huge (!) CSV file (104M) from long to wide format.  Note
-  that this takes a while:
-
-  $ R --slave -f convert-dirreqs-sql.R
-
-- The result is in dirreqs.csv (8.8M).
-
diff --git a/task-2718/convert-dirreqs-sql.R b/task-2718/convert-dirreqs-sql.R
deleted file mode 100644
index e330307..0000000
--- a/task-2718/convert-dirreqs-sql.R
+++ /dev/null
@@ -1,8 +0,0 @@
-library(ggplot2)
-data <- read.csv("dirreqs-sql.csv", header = FALSE)
-data <- data.frame(fingerprint = data$V1, statsend = data$V2,
-  seconds = data$V3, country = data$V4, requests = data$V5)
-data <- cast(data, fingerprint + statsend + seconds ~ country,
-  value = "requests")
-write.csv(data, file = "dirreqs.csv", quote = FALSE, row.names = FALSE)
-
diff --git a/task-2718/detect-censorship.R b/task-2718/detect-censorship.R
deleted file mode 100644
index f27e863..0000000
--- a/task-2718/detect-censorship.R
+++ /dev/null
@@ -1,52 +0,0 @@
-# Tor Censorship Detector
-# Usage: R --slave < detect-censorship.R
-
-# Read CSV file containing daily user number estimates.
-direct <- read.csv("direct-users.csv")
-
-# Start plotting everything to a single PDF (with multiple pages).
-pdf("detect-censorship.pdf")
-
-# Convert the column containing daily Iranian users to a time series
-# object, starting on the 263th day of 2009 with a frequency of 365 days.
-# We're probably off by a day or two, but this should be fine for now.
-all <- ts(direct$ir, start = c(2009, 263), frequency = 365)
-
-# Uncomment to print the time series values.
-#print(all)
-
-# Let's try our approach for the last 365 days to see if we detect any
-# blocking in that time period.  In the final version of this script, we'd
-# only have a single run with i = 1.
-for (i in 365:1) {
-  idx <- length(direct$date) - i
-
-  # Convert the daily Iranian users until i days in the past to a time
-  # series object.
-  x <- ts(direct$ir[1:idx], start = c(2009, 263), frequency = 365)
-
-  # Apply an ARIMA(1, 0, 1) model to the time series.
-  x.fit = arima(x, order = c(1, 0, 1))
-
-  # Predict 10 dates ahead.
-  x.fore=predict(x.fit, n.ahead=10)
-
-  # Calculate a lower bound.  Here we use the predicted value minus three
-  # standard errors.
-  L = x.fore$pred - 3*x.fore$se
-
-  # If the observed daily user number is lower than our predicted lower
-  # bound, plot the data and lower bound.
-  if (direct$ir[idx + 1] < L[1]) {
-
-    # Plot the full time series.
-    ts.plot(all)
-
-    # Add a line for the ten predicted values.
-    lines(L, col = "red", lwd = 2) 
-  }
-}
-
-# Close the PDF device.
-dev.off()
-





More information about the tor-commits mailing list