diff --git a/extract-twitter-accounts.R b/extract-twitter-accounts.R
index 746eb31..4cb976e 100644
--- a/extract-twitter-accounts.R
+++ b/extract-twitter-accounts.R
@@ -1,11 +1,11 @@
 # PREPARATIONS ------------------------------------------------------------
 
-
 require(jsonlite)
 require(stringr)
 require(RCurl)
 require(devtools)
 require(RTwitterAPI)
+require(lubridate)
 
 setwd("~/Dokumente/Uni/Aktuell/BA-Arbeit/uni-ba-issuecomp")
 
@@ -166,11 +166,11 @@ rm(a, code, current, error, loop, max_id, name, query, r, status, user, wait, tw
 
 # CLEAR DATAFRAME ---------------------------------------------------------
 
-tweets <- tweets_bak
+save(tweets_complete, file="tweets_complete.RData")
 
 # Remove duplicates
 tweets <- tweets_complete[!duplicated(tweets_complete), ]
-save(tweets_complete, file="tweets_complete.RData")
+tweets <- na.omit(tweets)
 save(tweets, file="tweets.RData")
 rm(tweets_complete)
 
@@ -193,5 +193,17 @@ for(r in 1:nrow(tweets)) {
 tweets <- tweets[-delrow, ]
 rm(delrow, r)
 
+# Convert dates to omit (unnecessary) time
+# NOTE(review): assumes created_at is a Date/POSIXct column here -- TODO confirm
+tweets$created_at <- format(tweets$created_at, "%Y-%m-%d")
 
+# Create date range: one Date per day from date_start to date_end, inclusive
+date_start <- as.Date("2014-01-01")
+date_end <- as.Date("2014-12-01")
+n_days <- as.integer(date_end - date_start)
+drange <- date_start + days(0:n_days)
+issues <- data.frame(date = drange)
 
+# Select all tweets from current day in drange
+# (index 5 is a hard-coded sample day: 2014-01-05)
+tweets_curday <- tweets[tweets[, "created_at"] == drange[5], ]