Analyzing Social Media Data in R
Sowmya Vivek
Data Science Coach
# Pull up to 18,000 tweets matching the #OOTD hashtag, retweets included
twts_OOTD <- search_tweets(
  q = "#OOTD ",
  n = 18000,
  include_rts = TRUE
)
# Keep only the two columns that describe a retweet relationship:
# the account that posted the tweet and the account it retweeted
rt_df <- twts_OOTD[, c("screen_name", "retweet_screen_name")]
# Preview the first 10 rows of the network data frame
head(rt_df, n = 10)
screen_name retweet_screen_name
<chr> <chr>
ShesinfashionCc NA
glamwearplanet NA
lanacond0r LiveKellyRyan
animeninjaz NA
zeluslondon NA
IonaJaneLevy NA
# Build a directed retweet network from the screen_name /
# retweet_screen_name pairs held in rt_df.

# Keep only rows where both columns are present; rows with NA in
# retweet_screen_name cannot form an edge (presumably these are
# original tweets rather than retweets -- confirm against the data)
rt_df_new <- rt_df[complete.cases(rt_df), ]
# graph_from_edgelist() expects a two-column matrix, one edge per row
matrx <- as.matrix(rt_df_new)
# Create the retweet network; with directed = TRUE each edge points
# from the first column (screen_name) to the second (retweet_screen_name)
library(igraph)
nw_rtweet <- graph_from_edgelist(el = matrx, directed = TRUE)
# View the retweet network. Call the print() generic and let S3 dispatch
# pick the igraph method rather than invoking print.igraph() directly.
print(nw_rtweet)
IGRAPH 7f42937 DN-- 4100 4616 --
+ attr: name (v/c)
+ edges from 7f42937 (vertex names):
[1] MaikielYungin ->ZingletC MaikielYungin ->ZingletC
[3] victoria_shop_1->victoria_shop_1 victoria_shop_1->victoria_shop_1
[5] victoria_shop_1->victoria_shop_1 victoria_shop_1->victoria_shop_1
[7] victoria_shop_1->victoria_shop_1 victoria_shop_1->victoria_shop_1
[9] victoria_shop_1->victoria_shop_1 w3daily ->RealFirstBuzz
[11] w3daily ->RealFirstBuzz w3daily ->RealFirstBuzz
[13] w3daily ->RealFirstBuzz w3daily ->RealFirstBuzz
[15] w3daily ->RealFirstBuzz w3daily ->RealFirstBuzz
Analyzing Social Media Data in R