Further parallel improvements: drop the df assignment from the foreach loop and disable per-tweet log writes

This commit is contained in:
2015-02-22 16:16:01 +01:00
parent b32c2cba58
commit d7de9dda0c
3 changed files with 425 additions and 474 deletions
+3 -3
View File
@@ -40,7 +40,7 @@ writeLines(c(""), "issuecomp-analysis.log")
cl<-makeCluster(4)
registerDoParallel(cl)
df<-foreach(d = 1:nrow(issues), .packages = c("stringr"), .combine=rbind) %dopar% {
foreach(d = 1:nrow(issues), .packages = c("stringr"), .combine=rbind) %dopar% {
#for(d in 1:nrow(issues)) {
# Go through every day
curdate <- issues$date[d]
@@ -50,7 +50,7 @@ df<-foreach(d = 1:nrow(issues), .packages = c("stringr"), .combine=rbind) %dopar
tweets_curday <- tweets[tweets[, "created_at"] == curdate, ]
for(t in 1:nrow(tweets_curday)){
cat(paste("Starting tweet", t, "of",as.character(curdate),"\n"), file="issuecomp-analysis.log", append=TRUE)
# cat(paste("Starting tweet", t, "of",as.character(curdate),"\n"), file="issuecomp-analysis.log", append=TRUE)
# Select tweet's text, make it lowercase and remove hashtag indicators (#)
curtext <- as.character(tweets_curday$text[t])
curtext <- str_replace_all(curtext, "#", "")
@@ -110,7 +110,7 @@ df<-foreach(d = 1:nrow(issues), .packages = c("stringr"), .combine=rbind) %dopar
# Add information to file for function viewPatternMatching
write(str_c(curdate,";\"",curid,"\";",curissue,";",curtag), curfile, append = TRUE)
cat(paste("Match!\n"), file="issuecomp-analysis.log", append=TRUE)
# cat(paste("Match!\n"), file="issuecomp-analysis.log", append=TRUE)
# data.frame(date=curdate, issue=curissue)
break # next issue, no more tags from same issue
}