changes folder structure of in- and output files
This commit is contained in:
parent
02c3d055bd
commit
27746cd886
@ -69,8 +69,11 @@ wd = "/home/michael/Documents/PS/Data/collectTweets/"
|
||||
# WD Server
|
||||
# wd = '/home/yunohost.multimedia/polsoc/Politics & Society/TweetCollection/'
|
||||
|
||||
# datafile input directory
|
||||
di = "data/IN/"
|
||||
|
||||
# Tweet-datafile output directory
|
||||
td = "data/tweets/"
|
||||
td = "data/OUT/"
|
||||
|
||||
# Name of file that all tweets will be written to
|
||||
file_alltweets = "ALL-SENATORS-TWEETS.csv"
|
||||
@ -171,9 +174,9 @@ print("---")
|
||||
# read keywords from a file and write to list.
|
||||
keywords = []
|
||||
# Remove duplicate Keywords and save all non-duplicates to 'data/keywords.txt'
|
||||
deDupe("data/keywords-raw.txt", "data/keywords.txt")
|
||||
deDupe(f"{di}keywords-raw.txt", f"{di}keywords.txt")
|
||||
# Read the keywords from a file
|
||||
with open("data/keywords.txt", "r") as file:
|
||||
with open(f"{di}keywords.txt", "r") as file:
|
||||
lines = file.readlines()
|
||||
for line in lines:
|
||||
keyword = line.strip() # Remove the newline character
|
||||
|
@ -1,140 +0,0 @@
|
||||
Coronavirus
|
||||
Koronavirus
|
||||
Corona
|
||||
CDC
|
||||
Wuhancoronavirus
|
||||
Wuhanlockdown
|
||||
Ncov
|
||||
Wuhan
|
||||
N95
|
||||
Kungflu
|
||||
Epidemic
|
||||
outbreak
|
||||
Sinophobia
|
||||
China
|
||||
covid-19
|
||||
corona virus
|
||||
covid
|
||||
covid19
|
||||
sars-cov-2
|
||||
COVIDー19
|
||||
COVD
|
||||
pandemic
|
||||
coronapocalypse
|
||||
canceleverything
|
||||
Coronials
|
||||
SocialDistancingNow
|
||||
Social Distancing
|
||||
SocialDistancing
|
||||
panicbuy
|
||||
panic buy
|
||||
panicbuying
|
||||
panic buying
|
||||
14DayQuarantine
|
||||
DuringMy14DayQuarantine
|
||||
panic shop
|
||||
panic shopping
|
||||
panicshop
|
||||
InMyQuarantineSurvivalKit
|
||||
panic-buy
|
||||
panic-shop
|
||||
coronakindness
|
||||
quarantinelife
|
||||
chinese virus
|
||||
chinesevirus
|
||||
stayhomechallenge
|
||||
stay home challenge
|
||||
sflockdown
|
||||
DontBeASpreader
|
||||
lockdown
|
||||
lock down
|
||||
shelteringinplace
|
||||
sheltering in place
|
||||
staysafestayhome
|
||||
stay safe stay home
|
||||
trumppandemic
|
||||
trump pandemic
|
||||
flattenthecurve
|
||||
flatten the curve
|
||||
china virus
|
||||
chinavirus
|
||||
quarentinelife
|
||||
PPEshortage
|
||||
saferathome
|
||||
stayathome
|
||||
stay at home
|
||||
stay home
|
||||
stayhome
|
||||
GetMePPE
|
||||
covidiot
|
||||
epitwitter
|
||||
pandemie
|
||||
wear a mask
|
||||
wearamask
|
||||
kung flu
|
||||
covididiot
|
||||
COVID__19
|
||||
omicron
|
||||
variant
|
||||
vaccine
|
||||
travel ban
|
||||
corona
|
||||
coronavirus
|
||||
sarscov2
|
||||
sars cov2
|
||||
sars cov 2
|
||||
covid_19
|
||||
ncov
|
||||
ncov2019
|
||||
2019-ncov
|
||||
pandemic 2019ncov
|
||||
2019ncov
|
||||
quarantine
|
||||
flattening the curve
|
||||
flatteningthecurve
|
||||
flattenthecurve
|
||||
hand sanitizer
|
||||
handsanitizer
|
||||
social distancing
|
||||
socialdistancing
|
||||
work from home
|
||||
workfromhome
|
||||
working from home
|
||||
workingfromhome
|
||||
ppe
|
||||
n95
|
||||
covidiots
|
||||
herd immunity
|
||||
herdimmunity
|
||||
pneumonia
|
||||
wuhan virus
|
||||
wuhanvirus
|
||||
kungflu
|
||||
vaccines
|
||||
corona vaccine
|
||||
corona vaccines
|
||||
coronavaccine
|
||||
coronavaccines
|
||||
face shield
|
||||
faceshield
|
||||
face shields
|
||||
faceshields
|
||||
health worker
|
||||
healthworker
|
||||
health workers
|
||||
healthworkers
|
||||
stayhomestaysafe
|
||||
coronaupdate
|
||||
frontlineheroes
|
||||
coronawarriors
|
||||
homeschool
|
||||
homeschooling
|
||||
hometasking
|
||||
masks4all
|
||||
wfh
|
||||
wash ur hands
|
||||
wash your hands
|
||||
washurhands
|
||||
washyourhands
|
||||
selfisolating
|
||||
self isolating
|
24
data/tweets/.gitignore
vendored
24
data/tweets/.gitignore
vendored
@ -1,24 +0,0 @@
|
||||
/ALL-SENATORS-LONG-LONG.csv
|
||||
/ALL-SENATORS.csv
|
||||
/CoryGardner-LONG.csv
|
||||
/CoryGardner.csv
|
||||
/DavidPerdueGA-LONG.csv
|
||||
/DavidPerdueGA.csv
|
||||
/DougJones-LONG.csv
|
||||
/DougJones.csv
|
||||
/KLoeffler-LONG.csv
|
||||
/KLoeffler.csv
|
||||
/MarthaMcSallyAZ-LONG.csv
|
||||
/MarthaMcSallyAZ.csv
|
||||
/SenAlexander-LONG.csv
|
||||
/SenAlexander.csv
|
||||
/SenPatRoberts-LONG.csv
|
||||
/SenPatRoberts.csv
|
||||
/SenatorEnzi-LONG.csv
|
||||
/SenatorEnzi.csv
|
||||
/SenatorIsakson-LONG.csv
|
||||
/SenatorIsakson.csv
|
||||
/SenatorTomUdall-LONG.csv
|
||||
/SenatorTomUdall.csv
|
||||
/VP-LONG.csv
|
||||
/VP.csv
|
Loading…
x
Reference in New Issue
Block a user