In [48]:
#Load libraries
library(ggplot2)
library(dplyr)
In [108]:
#Load SPON Data
spon_sentiment_all <- na.omit(read.csv("/home/hao/workspace/6thSemester/DataScience/data/SPON_All.csv", fileEncoding="UTF-16"))
head(spon_sentiment_all)
In [109]:
#Load Junge Freiheit Data
jf_sentiment_all <- na.omit(read.csv("/home/hao/workspace/6thSemester/DataScience/data/JF_ALL.csv", fileEncoding="UTF-8"))
head(jf_sentiment_all)
In [110]:
#Load Bild Data
bild_sentiment_all <- na.omit(read.csv("/home/hao/workspace/6thSemester/DataScience/data/BILD_All.csv", fileEncoding="UTF-8"))
head(bild_sentiment_all)
In [111]:
#Defining Method to aggregate positive_abs, neutral_abs, negative_abs to one value called polarity
calc_polarity <- function(positiv, neutral, negativ) {
sum <- positiv + neutral + negativ
polarity <- (positiv - negativ) / sum;
polarity
}
In [112]:
#Group SPON Data by Year
spon_sentiment_byYear <- spon_sentiment_all %>%
group_by(year) %>%
summarise(sum_positiv_abs = sum(positiv_abs),
sum_neutral_abs = sum(neutral_abs),
sum_negativ_abs = sum(negativ_abs),
polarity = calc_polarity(sum_positiv_abs, sum_neutral_abs, sum_negativ_abs),
mean_positiv_rel = mean(positiv_rel),
mean_neutral_rel = mean(neutral_rel),
mean_negativ_rel = mean(negativ_rel),
source = "SPON")
head(spon_sentiment_byYear)
In [113]:
#Group JF Data by Year
jf_sentiment_byYear <- jf_sentiment_all %>%
group_by(year) %>%
summarise(sum_positiv_abs = sum(positiv_abs),
sum_neutral_abs = sum(neutral_abs),
sum_negativ_abs = sum(negativ_abs),
polarity = calc_polarity(sum_positiv_abs, sum_neutral_abs, sum_negativ_abs),
mean_positiv_rel = mean(positiv_rel),
mean_neutral_rel = mean(neutral_rel),
mean_negativ_rel = mean(negativ_rel),
source = "JF")
#filter
jf_sentiment_byYear <- jf_sentiment_byYear[(jf_sentiment_byYear>=2001),]
head(jf_sentiment_byYear)
In [117]:
#Group Bild Data by Year
bild_sentiment_byYear <- bild_sentiment_all %>%
group_by(year) %>%
summarise(sum_positiv_abs = sum(positiv_abs),
sum_neutral_abs = sum(neutral_abs),
sum_negativ_abs = sum(negativ_abs),
polarity = calc_polarity(sum_positiv_abs, sum_neutral_abs, sum_negativ_abs),
mean_positiv_rel = mean(positiv_rel),
mean_neutral_rel = mean(neutral_rel),
mean_negativ_rel = mean(negativ_rel),
source = "BILD")
bild_sentiment_byYear$year <- as.numeric(as.character(bild_sentiment_byYear$year))
head(bild_sentiment_byYear)
In [125]:
#Plotting Polarity of all three News Sites
ggplot() +
#SPON
geom_line(data = spon_sentiment_byYear, aes(x=year, y=polarity, color = source)) +
geom_point(data = spon_sentiment_byYear, aes(x=year, y=polarity, color = source)) +
geom_smooth(data = spon_sentiment_byYear, aes(x=year, y=polarity, color = source), method = 'loess') +
#JF
geom_line(data = jf_sentiment_byYear, aes(x=year, y=polarity, color = source)) +
geom_point(data = jf_sentiment_byYear, aes(x=year, y=polarity, color = source)) +
geom_smooth(data = jf_sentiment_byYear, aes(x=year, y=polarity, color = source), method = 'loess') +
#BILD
geom_line(data = bild_sentiment_byYear, aes(x=year, y=polarity, color = source)) +
geom_point(data = bild_sentiment_byYear, aes(x=year, y=polarity, color = source)) +
geom_smooth(data = bild_sentiment_byYear, aes(x=year, y=polarity, color = source), method = 'loess')
In [ ]: