summary refs log tree commit diff stats
path: root/R Scripts/-recover-data.R
diff options
context:
space:
mode:
author Ben Green <bgreen@g.harvard.edu> 2015-06-08 15:21:51 -0400
committer Ben Green <bgreen@g.harvard.edu> 2015-06-08 15:21:51 -0400
commit 1739e9f5706bb8a73de5dbf0b467de49ea040898 (patch)
tree 6f1d0f166986c5f0757be9b40d8eeb3409ab022c /R Scripts/-recover-data.R
parent e5dada202c34521618bf82a086093c342841e5e8 (diff)
download criminal_cascades-1739e9f5706bb8a73de5dbf0b467de49ea040898.tar.gz
added my R scripts
Diffstat (limited to 'R Scripts/-recover-data.R')
-rwxr-xr-x R Scripts/-recover-data.R 27
1 files changed, 27 insertions, 0 deletions
diff --git a/R Scripts/-recover-data.R b/R Scripts/-recover-data.R
new file mode 100755
index 0000000..b34ffc6
--- /dev/null
+++ b/R Scripts/-recover-data.R
@@ -0,0 +1,27 @@
+# Rebuild dag_dat (edge endpoints, graph distance, vic_date pair) from Data/dag.csv.
+# NOTE(review): graph `d` is never created in this script; it must already exist.
+library(igraph)
+setwd("/Users/Ben/Documents/Harvard/Fall 2014/CS 284r Social Data Mining/Cascade Project/")
+
+el <- read.csv('Data/dag.csv')
+comps <- clusters(d)  # computed once; both membership and csize are read from it
+lcc <- induced.subgraph(d, which(comps$membership == which.max(comps$csize)))
+vic_ids <- which(V(lcc)$vic == TRUE)
+# el$from / el$to are positions in vic_ids; map them to vertex indices of lcc.
+from <- vic_ids[el$from]
+to <- vic_ids[el$to]
+# Parse the vic_date attribute at both endpoints of every edge.
+t1 <- as.Date(V(lcc)$vic_date[from], format = '%m/%d/%y')
+t2 <- as.Date(V(lcc)$vic_date[to], format = '%m/%d/%y')
+# One shortest.paths() call per distinct source vertex, covering all its targets.
+uf <- unique(from)
+dist <- rep(0, length(from))
+for (i in seq_along(uf)) {  # seq_along(): 1:length(uf) is c(1, 0) when uf is empty
+  if (i %% 1000 == 0) print(i)  # progress marker every 1000 sources
+  fi <- which(from == uf[i])
+  dist[fi] <- as.numeric(shortest.paths(lcc, v = uf[i], to = to[fi]))
+}
+# `dist` is passed unnamed so the output column keeps the name "dist".
+dag_dat <- data.frame(from = el$from, to = el$to, dist, t1, t2)
+save(dag_dat, file = 'Data/dag_dat.RData')
+write.csv(dag_dat, 'Data/dag_dat.csv')