changes folder structure of in- and output files
This commit is contained in:
parent
02c3d055bd
commit
27746cd886
@ -69,8 +69,11 @@ wd = "/home/michael/Documents/PS/Data/collectTweets/"
|
|||||||
# WD Server
|
# WD Server
|
||||||
# wd = '/home/yunohost.multimedia/polsoc/Politics & Society/TweetCollection/'
|
# wd = '/home/yunohost.multimedia/polsoc/Politics & Society/TweetCollection/'
|
||||||
|
|
||||||
|
# datafile input directory
|
||||||
|
di = "data/IN/"
|
||||||
|
|
||||||
# Tweet-datafile output directory
|
# Tweet-datafile output directory
|
||||||
td = "data/tweets/"
|
td = "data/OUT/"
|
||||||
|
|
||||||
# Name of file that all tweets will be written to
|
# Name of file that all tweets will be written to
|
||||||
file_alltweets = "ALL-SENATORS-TWEETS.csv"
|
file_alltweets = "ALL-SENATORS-TWEETS.csv"
|
||||||
@ -171,9 +174,9 @@ print("---")
|
|||||||
# read keywords from a file and write to list.
|
# read keywords from a file and write to list.
|
||||||
keywords = []
|
keywords = []
|
||||||
# Remove duplicate Keywords and save all non-duplicates to 'data/keywords.txt'
|
# Remove duplicate Keywords and save all non-duplicates to 'data/keywords.txt'
|
||||||
deDupe("data/keywords-raw.txt", "data/keywords.txt")
|
deDupe(f"{di}keywords-raw.txt", f"{di}keywords.txt")
|
||||||
# Read the keywords from a file
|
# Read the keywords from a file
|
||||||
with open("data/keywords.txt", "r") as file:
|
with open(f"{di}keywords.txt", "r") as file:
|
||||||
lines = file.readlines()
|
lines = file.readlines()
|
||||||
for line in lines:
|
for line in lines:
|
||||||
keyword = line.strip() # Remove the newline character
|
keyword = line.strip() # Remove the newline character
|
||||||
|
@ -1,140 +0,0 @@
|
|||||||
Coronavirus
|
|
||||||
Koronavirus
|
|
||||||
Corona
|
|
||||||
CDC
|
|
||||||
Wuhancoronavirus
|
|
||||||
Wuhanlockdown
|
|
||||||
Ncov
|
|
||||||
Wuhan
|
|
||||||
N95
|
|
||||||
Kungflu
|
|
||||||
Epidemic
|
|
||||||
outbreak
|
|
||||||
Sinophobia
|
|
||||||
China
|
|
||||||
covid-19
|
|
||||||
corona virus
|
|
||||||
covid
|
|
||||||
covid19
|
|
||||||
sars-cov-2
|
|
||||||
COVIDー19
|
|
||||||
COVD
|
|
||||||
pandemic
|
|
||||||
coronapocalypse
|
|
||||||
canceleverything
|
|
||||||
Coronials
|
|
||||||
SocialDistancingNow
|
|
||||||
Social Distancing
|
|
||||||
SocialDistancing
|
|
||||||
panicbuy
|
|
||||||
panic buy
|
|
||||||
panicbuying
|
|
||||||
panic buying
|
|
||||||
14DayQuarantine
|
|
||||||
DuringMy14DayQuarantine
|
|
||||||
panic shop
|
|
||||||
panic shopping
|
|
||||||
panicshop
|
|
||||||
InMyQuarantineSurvivalKit
|
|
||||||
panic-buy
|
|
||||||
panic-shop
|
|
||||||
coronakindness
|
|
||||||
quarantinelife
|
|
||||||
chinese virus
|
|
||||||
chinesevirus
|
|
||||||
stayhomechallenge
|
|
||||||
stay home challenge
|
|
||||||
sflockdown
|
|
||||||
DontBeASpreader
|
|
||||||
lockdown
|
|
||||||
lock down
|
|
||||||
shelteringinplace
|
|
||||||
sheltering in place
|
|
||||||
staysafestayhome
|
|
||||||
stay safe stay home
|
|
||||||
trumppandemic
|
|
||||||
trump pandemic
|
|
||||||
flattenthecurve
|
|
||||||
flatten the curve
|
|
||||||
china virus
|
|
||||||
chinavirus
|
|
||||||
quarentinelife
|
|
||||||
PPEshortage
|
|
||||||
saferathome
|
|
||||||
stayathome
|
|
||||||
stay at home
|
|
||||||
stay home
|
|
||||||
stayhome
|
|
||||||
GetMePPE
|
|
||||||
covidiot
|
|
||||||
epitwitter
|
|
||||||
pandemie
|
|
||||||
wear a mask
|
|
||||||
wearamask
|
|
||||||
kung flu
|
|
||||||
covididiot
|
|
||||||
COVID__19
|
|
||||||
omicron
|
|
||||||
variant
|
|
||||||
vaccine
|
|
||||||
travel ban
|
|
||||||
corona
|
|
||||||
coronavirus
|
|
||||||
sarscov2
|
|
||||||
sars cov2
|
|
||||||
sars cov 2
|
|
||||||
covid_19
|
|
||||||
ncov
|
|
||||||
ncov2019
|
|
||||||
2019-ncov
|
|
||||||
pandemic 2019ncov
|
|
||||||
2019ncov
|
|
||||||
quarantine
|
|
||||||
flattening the curve
|
|
||||||
flatteningthecurve
|
|
||||||
flattenthecurve
|
|
||||||
hand sanitizer
|
|
||||||
handsanitizer
|
|
||||||
social distancing
|
|
||||||
socialdistancing
|
|
||||||
work from home
|
|
||||||
workfromhome
|
|
||||||
working from home
|
|
||||||
workingfromhome
|
|
||||||
ppe
|
|
||||||
n95
|
|
||||||
covidiots
|
|
||||||
herd immunity
|
|
||||||
herdimmunity
|
|
||||||
pneumonia
|
|
||||||
wuhan virus
|
|
||||||
wuhanvirus
|
|
||||||
kungflu
|
|
||||||
vaccines
|
|
||||||
corona vaccine
|
|
||||||
corona vaccines
|
|
||||||
coronavaccine
|
|
||||||
coronavaccines
|
|
||||||
face shield
|
|
||||||
faceshield
|
|
||||||
face shields
|
|
||||||
faceshields
|
|
||||||
health worker
|
|
||||||
healthworker
|
|
||||||
health workers
|
|
||||||
healthworkers
|
|
||||||
stayhomestaysafe
|
|
||||||
coronaupdate
|
|
||||||
frontlineheroes
|
|
||||||
coronawarriors
|
|
||||||
homeschool
|
|
||||||
homeschooling
|
|
||||||
hometasking
|
|
||||||
masks4all
|
|
||||||
wfh
|
|
||||||
wash ur hands
|
|
||||||
wash your hands
|
|
||||||
washurhands
|
|
||||||
washyourhands
|
|
||||||
selfisolating
|
|
||||||
self isolating
|
|
24
data/tweets/.gitignore
vendored
24
data/tweets/.gitignore
vendored
@ -1,24 +0,0 @@
|
|||||||
/ALL-SENATORS-LONG-LONG.csv
|
|
||||||
/ALL-SENATORS.csv
|
|
||||||
/CoryGardner-LONG.csv
|
|
||||||
/CoryGardner.csv
|
|
||||||
/DavidPerdueGA-LONG.csv
|
|
||||||
/DavidPerdueGA.csv
|
|
||||||
/DougJones-LONG.csv
|
|
||||||
/DougJones.csv
|
|
||||||
/KLoeffler-LONG.csv
|
|
||||||
/KLoeffler.csv
|
|
||||||
/MarthaMcSallyAZ-LONG.csv
|
|
||||||
/MarthaMcSallyAZ.csv
|
|
||||||
/SenAlexander-LONG.csv
|
|
||||||
/SenAlexander.csv
|
|
||||||
/SenPatRoberts-LONG.csv
|
|
||||||
/SenPatRoberts.csv
|
|
||||||
/SenatorEnzi-LONG.csv
|
|
||||||
/SenatorEnzi.csv
|
|
||||||
/SenatorIsakson-LONG.csv
|
|
||||||
/SenatorIsakson.csv
|
|
||||||
/SenatorTomUdall-LONG.csv
|
|
||||||
/SenatorTomUdall.csv
|
|
||||||
/VP-LONG.csv
|
|
||||||
/VP.csv
|
|
Loading…
x
Reference in New Issue
Block a user