Skip to content
Snippets Groups Projects
Select Git revision
  • 4e0c96c59607fd366b7bb2430706351820b2369d
  • main default
  • tp2
  • tp1
  • tp3
  • tp2-correction
  • tp1-correction
  • admins
8 results

Operator.cpython-310.pyc

Blame
  • Forked from an inaccessible project.
    main.py 940 B
    import os

    import pandas as pd
    import snscrape.modules.twitter as sntwitter

    from src.functions import construct_query, convert_date
    
    # Result table: one row per kept tweet, holding its date and its text.
    table = pd.DataFrame(columns=['date', 'tweet'])

    # Search terms handed to construct_query() when the query is built.
    # NOTE(review): presumably `terms` must appear and `negativeTerms` must
    # not -- construct_query lives in src.functions; confirm there.
    terms = ["Metaverse"]
    negativeTerms = ["#metaverse"]

    # Search filters handed to construct_query() alongside the terms.
    # NOTE(review): presumably `negativeFilters` lists filters to exclude
    # (replies, links, retweets) -- confirm against construct_query.
    filters = []
    negativeFilters = ["replies", "links", "retweets", "nativeretweets"]

    # Only tweets whose `lang` attribute is in this list are kept.
    languages = ["en"]

    # Cap on how many search results are walked through before stopping;
    # also the denominator of the progress percentage that gets printed.
    tweetNumber = 1000
    
    # Scrape the search results, keep the tweets that match the language and
    # keyword criteria, then de-duplicate, sort and export them as JSON.
    query = construct_query(terms, negativeTerms, filters, negativeFilters)
    scraper = sntwitter.TwitterSearchScraper(query=query)

    # Kept tweets are gathered in a plain list and turned into a DataFrame
    # once at the end: calling pd.concat for every row re-copies the whole
    # table each time (quadratic) and left every row with index 0.
    rows = []
    for i, tweet in enumerate(scraper.get_items()):
        # `>=` so that exactly `tweetNumber` results are examined (indices
        # 0 .. tweetNumber - 1); it also stops immediately when the cap is 0,
        # before the progress computation could divide by zero.
        if i >= tweetNumber:
            break

        text = tweet.rawContent
        # The search itself is term based, so re-check that the word really
        # occurs in the text, case-insensitively. The date is only converted
        # for tweets that are actually kept.
        if tweet.lang in languages and "metaverse" in text.lower():
            rows.append({'date': convert_date(tweet.date), 'tweet': text})

        # Share of the requested results handled so far (reaches 100 on the
        # last examined result).
        print((i + 1) / tweetNumber * 100, " %")

    # Explicit columns keep the 'date'/'tweet' layout even when nothing matched.
    table = pd.DataFrame(rows, columns=['date', 'tweet'])
    table = table.drop_duplicates(subset=["tweet"]).sort_values(by=["tweet"])

    # Create the target directory first so a long scrape is not lost to a
    # missing folder when the file is written.
    os.makedirs("output", exist_ok=True)
    table.to_json("output/twitter_data.json", orient="split")