Skip to content
Snippets Groups Projects
Commit 5553680f authored by Guillaume Di Fatta
Browse files

initial commit

parents
Branches
No related tags found
1 merge request: !1 "initial commit"
main.py 0 → 100644
from itertools import islice
from pathlib import Path

import pandas as pd
import snscrape.modules.twitter as sntwitter

from src.functions import construct_query, convert_date
# Scrape tweets that mention "metaverse" and store them as JSON.
#
# The script searches Twitter through snscrape, keeps tweets written in one of
# the configured languages whose text contains the word "metaverse", removes
# duplicate texts, sorts the rows by tweet text and writes the result to
# output/twitter_data.json.

# --- Search configuration ---------------------------------------------------
# Terms to include in / exclude from the query (excluded ones get a "-" prefix).
terms = ["Metaverse"]
negativeTerms = ["#metaverse"]
# Search filters to require / exclude ("filter:<name>" / "-filter:<name>").
filters = []
negativeFilters = ["replies", "links", "retweets", "nativeretweets"]
# Only tweets whose `lang` attribute is in this list are kept.
languages = ["en"]
# Upper bound on the number of search results scanned (not on rows kept).
tweetNumber = 1000

query = construct_query(terms, negativeTerms, filters, negativeFilters)
scraper = sntwitter.TwitterSearchScraper(query=query)

# Collect matching rows in a plain list and build the DataFrame once at the
# end: concatenating a one-row frame per tweet copies the whole table each
# time and leaves every row with the same index label (0).
records = []

# islice stops after exactly `tweetNumber` results; the previous
# `if i > tweetNumber: break` check let one extra result through.
for scanned, tweet in enumerate(islice(scraper.get_items(), tweetNumber), start=1):
    text = tweet.rawContent
    if tweet.lang in languages and "metaverse" in text.lower():
        records.append({'date': convert_date(tweet.date), 'tweet': text})
    # Progress is reported for every scanned result, matching or not.
    print(scanned / tweetNumber * 100, " %")

table = pd.DataFrame(records, columns=['date', 'tweet'])
# Keep the first occurrence of each tweet text, then order rows by text.
# ignore_index gives the written rows unique labels 0..n-1.
table = table.drop_duplicates(subset=["tweet"]).sort_values(
    by=["tweet"], ignore_index=True
)

output_path = Path("output/twitter_data.json")
# to_json does not create missing directories, so make sure "output/" exists.
output_path.parent.mkdir(parents=True, exist_ok=True)
table.to_json(output_path, orient="split")
This diff is collapsed.
File added
import datetime as dt
def construct_query(terms, negativeTerms, filters, negativeFilters):
    """Build a search query string from term and filter lists.

    Tokens are emitted in this order, each followed by a single space:
    every term as-is, every negative term prefixed with ``-``, every filter
    prefixed with ``filter:`` and every negative filter prefixed with
    ``-filter:``.

    Args:
        terms: Strings to include in the query.
        negativeTerms: Strings to exclude from the query.
        filters: Filter names to require.
        negativeFilters: Filter names to exclude.

    Returns:
        The concatenated query string. Because every token carries its own
        trailing space, a non-empty result ends with a space; four empty
        inputs yield ``""``.

    Example:
        >>> construct_query(["a"], ["b"], ["media"], ["links"])
        'a -b filter:media -filter:links '
    """
    groups = (
        ("", terms),
        ("-", negativeTerms),
        ("filter:", filters),
        ("-filter:", negativeFilters),
    )
    # A single join replaces four copy-pasted `query += ...` loops and avoids
    # rebuilding the string on every token.
    return "".join(
        prefix + entry + " " for prefix, entries in groups for entry in entries
    )
def convert_date(date):
    """Format *date* as a ``MM/DD/YYYY, HH:MM:SS`` string.

    Args:
        date: Any object exposing ``strftime`` (e.g. ``datetime.datetime``).

    Returns:
        The formatted timestamp string.
    """
    pattern = "%m/%d/%Y, %H:%M:%S"
    formatted = date.strftime(pattern)
    return formatted
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment