Commit 851fcdbd authored by Decoupes Remy's avatar Decoupes Remy
Browse files

Build the output for graph visualization with Gephi

parent 878a75fc
......@@ -6,8 +6,14 @@
},
"text",
"id",
"in_reply_to_status_id",
"extended_tweet.full_text",
"retweeted_status.id",
"user.location",
"entities.media.expanded_url",
"entities.urls.expanded_url",
"user.name",
"retweeted_status.user.name",
"rest.*"
],
"_source": false,
......
......@@ -137,3 +137,26 @@ if __name__ == '__main__':
# Copy the index into a regular column (presumably the terms, going by the
# column name): the column-based merge below does not preserve the index.
df_tfidf["tf_idf_terms"] = df_tfidf.index
# Attach the columns of df_results to the rows sharing the same "index_of_tweet".
df_tfidf = df_tfidf.merge(df_results, on="index_of_tweet")
# NOTE(review): absolute, user-specific output path — confirm it exists
# wherever this script is run.
df_tfidf.to_csv("/home/rdecoupe/Téléchargements/acquitaine3.csv")
# Build the Gephi edge list of the retweet graph: one row per retweet, with an
# edge going from the tweet's author ("user.name") to the author of the
# retweeted status ("retweeted_status.user.name").
# `assign` returns a new frame, so the helper columns are not added to
# df_results itself.
gephi = df_results.assign(
    Source=df_results["user.name"],
    Target=df_results["retweeted_status.user.name"],
    ID=df_results.index,
    Timestamp=df_results["@timestamp"],
    label=df_results["retweeted_status.user.name"],
)
# Keep only the retweets. `.str.len()` yields NaN for a missing value and
# `NaN != 0` is True, so the comparison has to be `> 0` to drop the missing
# targets as well as the empty ones.
gephi = gephi[gephi["Target"].str.len() > 0]
# NOTE(review): absolute, user-specific output path — confirm it exists
# wherever this script is run.
gephi[["ID", "label", "Source", "Target", "Timestamp"]].to_csv(
    "/home/rdecoupe/Téléchargements/acquitaine_script_gephi.csv",
    index=False,
)
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment