finishes classification scripts
This commit is contained in:
parent
2535683cdc
commit
4e08cde317
@ -43,6 +43,16 @@ import CleanTweets
|
|||||||
#%%
|
#%%
|
||||||
# get dataframe
|
# get dataframe
|
||||||
dfClassify = pd.read_csv(senCSVPath, dtype=(object))
|
dfClassify = pd.read_csv(senCSVPath, dtype=(object))
|
||||||
|
def encode_labels(label):
    """Swap the string labels 'True' and 'False'.

    Args:
        label: A single cell value from the label column.

    Returns:
        'False' when ``label`` is the string 'True', 'True' when it is the
        string 'False', and the integer 0 for any other value (including
        the booleans True/False, None and NaN, which never compare equal
        to those strings).
    """
    # NOTE(review): the inversion looks deliberate (the upstream labels are
    # presumably reversed) -- confirm before relying on it.
    if label == 'True':
        return 'False'
    elif label == 'False':
        return 'True'
    # Fallback for anything that is not one of the two expected strings.
    return 0
|
||||||
|
dfClassify['output_label_topicCov'] = dfClassify['output_label_topicCov'].apply(encode_labels)
|
||||||
|
dfClassify.to_csv("/home/michael/Documents/PS/Data/collectTweets/data/OUT/Tweets-Classified-Topic-Results.csv", encoding='utf-8')
|
||||||
|
|
||||||
|
dfClassify = dfClassify[dfClassify['output_label_topicCov']=='True']
|
||||||
|
|
||||||
# dataframe from csv
|
# dataframe from csv
|
||||||
dfClassify['fake'] = False
|
dfClassify['fake'] = False
|
||||||
|
@ -110,3 +110,14 @@ print(f"Time per tweet classification: {timePerTweet}")
|
|||||||
dfClassify.to_csv(senCSVcClassificationResultPath, encoding='utf-8')
|
dfClassify.to_csv(senCSVcClassificationResultPath, encoding='utf-8')
|
||||||
|
|
||||||
# %%
|
# %%
|
||||||
|
## corrections
|
||||||
|
def encode_labels(label):
    """Translate the labels 'real' / 'fake' into the strings 'True' / 'False'.

    Args:
        label: A single cell value from the label column.

    Returns:
        'True' when ``label`` is the string 'real', 'False' when it is the
        string 'fake', and the integer 0 for any other value.
    """
    # NOTE(review): this reuses the name ``encode_labels``; if an earlier
    # definition exists in the same script it is shadowed from here on.
    if label == 'real':
        return 'True'
    elif label == 'fake':
        return 'False'
    # Fallback for anything that is not one of the two expected strings.
    return 0
|
||||||
|
dfClassify['output_label_topicCov'] = dfClassify['output_label_topicCov'].apply(encode_labels)
|
||||||
|
dfClassify.to_csv(senCSVcClassificationResultPath, encoding='utf-8')
|
||||||
|
# Still wrong; will be corrected in ClassificationFake.py
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user