In [40]:
library(dplyr)
In [41]:
# Load the views-vs-quality correlation results. The file is tab-separated
# and has no header row, so read.table() assigns default V1, V2, ... names.
quality_prediction_and_page_views <- read.table(
  file = "../results/sql_queries/entity_views_and_aggregated_revisions/entity_views_and_aggregated_revisions_and_quality_scoring_correlation.tsv",
  sep = "\t",
  header = FALSE
)
In [42]:
# Label the three columns of the correlation table.
# NOTE(review): 'yymm' looks like a year-month key and 'p' like the p-value of
# the Spearman correlation -- confirm against the script that wrote the TSV.
names(quality_prediction_and_page_views) <- c(
  "yymm",
  "spearman_corr_of_views_versus_quality",
  "p"
)
In [43]:
# Load the monthly bot-edit statistics. The file is tab-separated and has no
# header row, so read.table() assigns default V1, V2, ... names.
monthly_bot_edits <- read.table(
  file = "../results/wikidata_page_revisions_with_timestamp_bot_info/monthly_bot_edits_converted.tsv",
  sep = "\t",
  header = FALSE
)
In [44]:
# Label the six columns of the bot-edit table. 'yymm' is the key later used to
# join this table with the correlation table.
names(monthly_bot_edits) <- c(
  "yyyy",
  "mm",
  "yymm",
  "prev_month_bot_edits_over_total",
  "prev_month_bot_edits",
  "prev_month_edits"
)
In [45]:
# Join bot-edit statistics with the correlation table on 'yymm'. merge()
# defaults to an inner join, so only months present in both tables survive.
# The trailing index keeps just the analysis columns, in this order.
quality_predictions_and_page_views_and_monthly_bot_edits <- merge(
  x = monthly_bot_edits,
  y = quality_prediction_and_page_views,
  by = "yymm"
)[c(
  "yymm",
  "prev_month_bot_edits_over_total",
  "prev_month_bot_edits",
  "prev_month_edits",
  "spearman_corr_of_views_versus_quality",
  "p"
)]
In [46]:
# Order the correlation table by ascending 'yymm'.
sorted_quality_prediction_and_page_views <-
  quality_prediction_and_page_views %>%
  dplyr::arrange(yymm)
In [47]:
# Order the joined table by ascending 'yymm'.
sorted_quality_predictions_and_page_views_and_monthly_bot_edits <-
  quality_predictions_and_page_views_and_monthly_bot_edits %>%
  dplyr::arrange(yymm)
In [48]:
# Add a 1-based index over the sorted rows, used as the time axis in the
# plots and regressions. The index is derived from the actual row count
# instead of a hard-coded 57, so the cell keeps working when the input file
# gains or loses rows. It is stored as a plain integer vector rather than an
# n x 1 matrix, so cor() on this column returns a scalar.
sorted_quality_prediction_and_page_views$row_number <-
  seq_len(nrow(sorted_quality_prediction_and_page_views))
In [49]:
# Add a 1-based index over the sorted rows of the joined table, used as the
# time axis in the plots and regressions. The index is derived from the
# actual row count instead of a hard-coded 56, so the cell keeps working when
# the join yields a different number of rows. It is stored as a plain integer
# vector rather than an n x 1 matrix, so cor() on this column returns a scalar.
sorted_quality_predictions_and_page_views_and_monthly_bot_edits$row_number <-
  seq_len(nrow(sorted_quality_predictions_and_page_views_and_monthly_bot_edits))
In [50]:
# Display up to the first 60 rows of the sorted joined table for inspection.
utils::head(
  x = sorted_quality_predictions_and_page_views_and_monthly_bot_edits,
  n = 60
)
In [51]:
# Scatter plot of the views-vs-quality Spearman correlation against the row
# index, with an ordinary least-squares trend line on top.
#
# Points and trend line are both taken from
# sorted_quality_prediction_and_page_views. Previously the points came from
# the joined table while the line was fitted on this one; the two tables can
# have different rows, and therefore different row_number values for the same
# month, so the line could be offset from the points it was meant to describe.
# This table is also the one used by the correlation and regression summary
# that follow this plot.
plot(
  sorted_quality_prediction_and_page_views$row_number,
  sorted_quality_prediction_and_page_views$spearman_corr_of_views_versus_quality,
  xlab = "Month",
  ylab = "Spearman Correlation of Views versus Quality"
)
abline(
  lm(
    spearman_corr_of_views_versus_quality ~ row_number,
    data = sorted_quality_prediction_and_page_views
  )
)
In [52]:
# Spearman rank correlation between the row index and the views-vs-quality
# correlation.
with(
  sorted_quality_prediction_and_page_views,
  cor(
    row_number,
    spearman_corr_of_views_versus_quality,
    method = "spearman"
  )
)
In [53]:
# Linear regression of the views-vs-quality correlation on the row index.
# The formula names the columns and passes the table through `data =` rather
# than embedding `df$col` terms: the estimates are identical, but the
# coefficient labels in the summary are readable and the fitted model can be
# used with predict(newdata = ...).
summary(
  lm(
    spearman_corr_of_views_versus_quality ~ row_number,
    data = sorted_quality_prediction_and_page_views
  )
)
In [54]:
# Scatter plot of the bot-edit share against the row index of the joined
# table, with an ordinary least-squares trend line fitted on the same table.
plot(
  x = sorted_quality_predictions_and_page_views_and_monthly_bot_edits[["row_number"]],
  y = sorted_quality_predictions_and_page_views_and_monthly_bot_edits[["prev_month_bot_edits_over_total"]],
  xlab = "Month",
  ylab = "Bot edits over total"
)
abline(
  reg = lm(
    prev_month_bot_edits_over_total ~ row_number,
    data = sorted_quality_predictions_and_page_views_and_monthly_bot_edits
  )
)
In [55]:
# Spearman rank correlation between the row index and the bot-edit share.
with(
  sorted_quality_predictions_and_page_views_and_monthly_bot_edits,
  cor(
    row_number,
    prev_month_bot_edits_over_total,
    method = "spearman"
  )
)
In [56]:
# Linear regression of the bot-edit share on the row index of the joined
# table. The formula names the columns and passes the table through `data =`
# rather than embedding `df$col` terms: the estimates are identical, but the
# coefficient labels in the summary are readable and the fitted model can be
# used with predict(newdata = ...).
summary(
  lm(
    prev_month_bot_edits_over_total ~ row_number,
    data = sorted_quality_predictions_and_page_views_and_monthly_bot_edits
  )
)
In [57]:
# Spearman rank correlation between the views-vs-quality correlation and the
# bot-edit share, computed over the rows of the joined table.
with(
  sorted_quality_predictions_and_page_views_and_monthly_bot_edits,
  cor(
    spearman_corr_of_views_versus_quality,
    prev_month_bot_edits_over_total,
    method = "spearman"
  )
)
In [58]:
# Linear regression of the bot-edit share on the views-vs-quality
# correlation, over the rows of the joined table. The formula names the
# columns and passes the table through `data =` rather than embedding
# `df$col` terms: the estimates are identical, but the coefficient labels in
# the summary are readable and the fitted model can be used with
# predict(newdata = ...).
summary(
  lm(
    prev_month_bot_edits_over_total ~ spearman_corr_of_views_versus_quality,
    data = sorted_quality_predictions_and_page_views_and_monthly_bot_edits
  )
)
In [ ]: