# -*- coding: utf-8 -*- """Data_Gathering_Twint.ipynb Automatically generated by Colaboratory. Original file is located at https://colab.research.google.com/drive/1zV6s2FhvQCmyNh0uyknfm47WATAOihbU """ from google.colab import drive drive.mount('/content/drive') !git clone https://github.com/twintproject/twint.git import os os.chdir("/content/twint") !pip freeze > requirements.txt !pip install . !pip install -U git+https://github.com/cyxv/twint.git@master !pip install nest_asyncio !pip3 install twint # Import required libraries import nest_asyncio nest_asyncio.apply() import pandas as pd import twint import pandas as pd import re # add some tweets with depressed and depression tags, for a particular year depress_tags = ["#depressed", "#anxiety", "#depression", "#suicide", "#mentalhealth" "#loneliness", "#hopelessness", "#itsokaynottobeokay"] content = {} for i in range(len(depress_tags)): print(depress_tags[i]) c = twint.Config() c.Format = "Tweet id: {id} | Tweet: {tweet}" c.Search = depress_tags[i] c.Limit = 1000 c.Year = 2019 c.Lang = "en" c.Store_csv = True c.Store_Object = True c.Output = "/content/drive/MyDrive/NLP/Depression_Detection/depressive_en_2019.csv" c.Hide_output = True c.Stats = True c.Lowercase = True c.Filter_retweets = True twint.run.Search(c) # add some tweets with depressed and depression tags, for a particular year depress_tags = ["#depressed", "#depression", "#loneliness", "#hopelessness"] content = {} for i in range(len(depress_tags)): print(depress_tags[i]) c = twint.Config() c.Format = "Tweet id: {id} | Tweet: {tweet}" c.Search = depress_tags[i] c.Limit = 1000 c.Year = 2020 c.Store_csv = True c.Store_json = True c.Output = "/content/drive/MyDrive/NLP/Depression_Detection/dataset_depression.json" c.Hide_output = True c.Stats = True c.Lowercase = True c.Filter_retweets = True twint.run.Search(c)