In [1]:
library(data.table)
library(ggplot2)
library(viridis)


Loading required package: viridisLite

In [72]:
# Heavily penalise scientific notation so large edit counts print in fixed
# notation in the tables and on the plot axes.
options(scipen = 999)

In [73]:
# Load the tab-separated monthly aggregation table (header row present).
# This copy later receives the derived `semi_automated` column.
revision_agent_types_by_month <- read.table(
  "../../../results/misalignment_edit_types_tables_and_queries/attribute_aggregations.tsv",
  header = TRUE,
  sep = "\t"
)

In [74]:
# Second, independent load of the same aggregation TSV; this copy feeds the
# per-tool breakdown of semi-automated edits.
revision_all_agent_types_by_month <- read.table(
  "../../../results/misalignment_edit_types_tables_and_queries/attribute_aggregations.tsv",
  header = TRUE,
  sep = "\t"
)

In [75]:
# Print min / quartiles / mean / max for every column of the monthly table.
summary(revision_all_agent_types_by_month)


      year          month           bot_edit        quickstatements  
 Min.   :2012   Min.   : 1.000   Min.   :     700   Min.   :      0  
 1st Qu.:2014   1st Qu.: 3.000   1st Qu.: 3262839   1st Qu.:      0  
 Median :2015   Median : 6.000   Median : 4773374   Median :      0  
 Mean   :2015   Mean   : 6.357   Mean   : 5132675   Mean   : 385516  
 3rd Qu.:2016   3rd Qu.: 9.250   3rd Qu.: 6548053   3rd Qu.: 719013  
 Max.   :2017   Max.   :12.000   Max.   :13948677   Max.   :2259076  
    petscan         autolist2         autoedit      labellister  
 Min.   :     0   Min.   :     0   Min.   :    0   Min.   :   0  
 1st Qu.:     0   1st Qu.:     0   1st Qu.: 2800   1st Qu.:1984  
 Median :     0   Median :     0   Median : 3511   Median :3199  
 Mean   : 92311   Mean   : 47141   Mean   : 3959   Mean   :3196  
 3rd Qu.:  3516   3rd Qu.:     0   3rd Qu.: 4443   3rd Qu.:4126  
 Max.   :982098   Max.   :748752   Max.   :19225   Max.   :9404  
  itemcreator      dragrefjs            lcjs          wikidatagame  
 Min.   :    0   Min.   :    0.0   Min.   :   0.00   Min.   :    0  
 1st Qu.:    0   1st Qu.:    0.0   1st Qu.:   0.75   1st Qu.:    0  
 Median :    0   Median :    0.0   Median : 427.50   Median :    0  
 Mean   : 1441   Mean   :  892.5   Mean   : 771.59   Mean   : 8049  
 3rd Qu.:    0   3rd Qu.:  591.8   3rd Qu.:1273.00   3rd Qu.:17229  
 Max.   :42957   Max.   :10702.0   Max.   :4852.00   Max.   :41743  
 wikidataprimary   mixnmatch     distributedgame  nameguzzler     
 Min.   :    0   Min.   :    0   Min.   :    0   Min.   :    0.0  
 1st Qu.:    0   1st Qu.:    0   1st Qu.:    0   1st Qu.:  497.2  
 Median :    0   Median :    0   Median :    0   Median : 1456.5  
 Mean   : 6396   Mean   : 5764   Mean   : 3965   Mean   : 2618.2  
 3rd Qu.: 8226   3rd Qu.:10744   3rd Qu.: 6504   3rd Qu.: 4162.0  
 Max.   :39648   Max.   :29487   Max.   :34273   Max.   :14077.0  
    mergejs        reasonator       duplicity   tabernacle     Widar       
 Min.   :    0   Min.   :   0.0   Min.   :0   Min.   :0    Min.   : 0.000  
 1st Qu.: 7311   1st Qu.:   0.0   1st Qu.:0   1st Qu.:0    1st Qu.: 0.000  
 Median :10491   Median :   0.0   Median :0   Median :0    Median : 4.000  
 Mean   : 9657   Mean   : 217.7   Mean   :0   Mean   :0    Mean   : 6.089  
 3rd Qu.:12229   3rd Qu.: 181.0   3rd Qu.:0   3rd Qu.:0    3rd Qu.: 8.250  
 Max.   :25081   Max.   :3203.0   Max.   :0   Max.   :0    Max.   :52.000  
      reCh             HHVM             PAWS            Kaspar      
 Min.   : 0.000   Min.   :0.0000   Min.   :0.0000   Min.   :  0.00  
 1st Qu.: 1.000   1st Qu.:0.0000   1st Qu.:0.0000   1st Qu.:  9.00  
 Median : 5.500   Median :0.0000   Median :0.0000   Median : 16.50  
 Mean   : 6.554   Mean   :0.2321   Mean   :0.3036   Mean   : 43.48  
 3rd Qu.:10.000   3rd Qu.:0.0000   3rd Qu.:0.0000   3rd Qu.: 46.75  
 Max.   :20.000   Max.   :5.0000   Max.   :5.0000   Max.   :483.00  
   itemFinder      rgCh       not_flagged_elsewhere_quickstatments_bot_account
 Min.   :0    Min.   :0.000   Min.   :0.00000                                 
 1st Qu.:0    1st Qu.:0.000   1st Qu.:0.00000                                 
 Median :0    Median :0.000   Median :0.00000                                 
 Mean   :0    Mean   :1.321   Mean   :0.07143                                 
 3rd Qu.:0    3rd Qu.:2.000   3rd Qu.:0.00000                                 
 Max.   :0    Max.   :8.000   Max.   :3.00000                                 
 other_semi_automated_edit_since_change_tag   anon_edit       human_edit     
 Min.   :      0                            Min.   :  517   Min.   :  38989  
 1st Qu.:   5104                            1st Qu.:29768   1st Qu.: 590023  
 Median : 539215                            Median :34769   Median : 695782  
 Mean   : 633039                            Mean   :35411   Mean   : 707740  
 3rd Qu.: 948789                            3rd Qu.:43007   3rd Qu.: 885609  
 Max.   :2797426                            Max.   :81582   Max.   :1117892  
 tool_bot_like_edit human_bot_like_edit anon_bot_like_edit
 Min.   :     0.0   Min.   :     9.0    Min.   :   0.00   
 1st Qu.:   213.2   1st Qu.:   879.5    1st Qu.:   0.00   
 Median : 13835.5   Median :  2895.5    Median :   3.00   
 Mean   : 53178.3   Mean   : 12012.3    Mean   : 446.89   
 3rd Qu.: 94454.0   3rd Qu.: 11678.8    3rd Qu.:  32.75   
 Max.   :252695.0   Max.   :151910.0    Max.   :7034.00   

In [76]:
# Show the attributes (names and class) of the summary object computed for
# the bot_edit column.
attributes(summary(revision_all_agent_types_by_month$bot_edit))
# head(revision_all_agent_types_by_month, n=60)


$names
  1. 'Min.'
  2. '1st Qu.'
  3. 'Median'
  4. 'Mean'
  5. '3rd Qu.'
  6. 'Max.'
$class
  1. 'summaryDefault'
  2. 'table'

In [77]:
# Build a long-format table (month_order, edits, group) holding the monthly
# edit count of each semi-automated tool, one row per (month, tool).

# Sort chronologically. The secondary key must be `month`: sorting on `year`
# twice left the order of months inside each year to the input file's row
# order.
revision_all_agent_types_by_month_ordered_by_year_month <-
  revision_all_agent_types_by_month[
    order(
      revision_all_agent_types_by_month$year,
      revision_all_agent_types_by_month$month
    ),
  ]

# Keep the first 55 months. head() never pads with NA rows when fewer rows
# are available, and the index is derived from the rows actually kept.
revision_all_agent_types_by_month_ordered_by_year_month <-
  head(revision_all_agent_types_by_month_ordered_by_year_month, n = 55)
revision_all_agent_types_by_month_ordered_by_year_month$month_order <-
  seq_len(nrow(revision_all_agent_types_by_month_ordered_by_year_month))

# Tool columns to plot; each name is both the source column and the legend
# label. (The "lcjs" label previously carried a stray trailing space.)
semi_automated_tools <- c(
  "quickstatements", "petscan", "autolist2", "autoedit", "labellister",
  "itemcreator", "dragrefjs", "lcjs", "wikidatagame", "wikidataprimary",
  "mixnmatch", "distributedgame", "nameguzzler", "mergejs"
)

# One table per tool with columns V1 (month index), edit and group.
per_tool_edits <- lapply(
  setNames(nm = semi_automated_tools),
  function(tool) {
    data.table(
      V1 = revision_all_agent_types_by_month_ordered_by_year_month$month_order,
      edit = revision_all_agent_types_by_month_ordered_by_year_month[[tool]],
      group = tool
    )
  }
)

# Keep each per-tool table available under its original top-level name
# (quickstatements, petscan, ...) for any code that still refers to them.
invisible(list2env(per_tool_edits, envir = environment()))

# Stack the per-tool tables in the order listed above.
semi_automated_edits_grouped_by_agent_type <- rbindlist(per_tool_edits)

colnames(semi_automated_edits_grouped_by_agent_type) <-
  c("month_order", "edits", "group")
head(semi_automated_edits_grouped_by_agent_type)


month_ordereditsgroup
1 0 quickstatements
2 0 quickstatements
3 0 quickstatements
4 0 quickstatements
5 0 quickstatements
6 0 quickstatements

In [78]:
# One line with point markers per semi-automated tool across the month index;
# colour and line type both encode the tool.
ggplot(
  semi_automated_edits_grouped_by_agent_type,
  aes(x = month_order, y = edits, color = group, linetype = group)
) +
  geom_point() +
  geom_line() +
  labs(title = "Semi-Automated Agent Type By Month") +
  scale_color_viridis(discrete = TRUE)



In [79]:
# Columns whose element-wise sum forms the monthly semi-automated total.
semi_automated_columns <- c(
  "quickstatements", "petscan", "autolist2", "autoedit", "labellister",
  "itemcreator", "dragrefjs", "lcjs", "wikidatagame", "wikidataprimary",
  "mixnmatch", "distributedgame", "nameguzzler", "mergejs", "reasonator",
  "duplicity", "tabernacle", "Widar", "reCh", "HHVM", "PAWS", "Kaspar",
  "itemFinder", "rgCh",
  "not_flagged_elsewhere_quickstatments_bot_account",
  "other_semi_automated_edit_since_change_tag",
  "tool_bot_like_edit"
)

# Left-to-right fold with `+`, i.e. the same additions in the same order as
# writing col1 + col2 + ... by hand.
revision_agent_types_by_month$semi_automated <- Reduce(
  `+`,
  revision_agent_types_by_month[semi_automated_columns]
)

# Order rows by (year, month), keep the first 55 and number them 1..55.
revision_agent_types_by_month_ordered_by_year_month <-
  revision_agent_types_by_month[
    with(revision_agent_types_by_month, order(year, month))[seq_len(55)],
  ]
revision_agent_types_by_month_ordered_by_year_month$month_order <- seq_len(55)
head(revision_agent_types_by_month_ordered_by_year_month, n = 60)


yearmonthbot_editquickstatementspetscanautolist2autoeditlabellisteritemcreatordragrefjsrgChnot_flagged_elsewhere_quickstatments_bot_accountother_semi_automated_edit_since_change_taganon_edithuman_edittool_bot_like_edithuman_bot_like_editanon_bot_like_editsemi_automatedmonth_order
192012 11 700 0 0 0 0 0 0 0 0 0 0 517 263987 0 6887 0 0 1
202012 12 183629 0 0 0 18041 8063 0 0 0 0 0 2795 205204 0 673 0 26114 2
212013 1 1932349 0 0 0 19225 4528 0 0 0 0 0 2216 170870 0 15448 0 23754 3
222013 2 2285161 0 0 0 3741 3875 0 0 0 0 0 2073 183928 2 1273 0 7620 4
232013 3 2264112 0 0 0 2574 3411 0 0 0 0 0 8211 347624 0 2023 0 5991 5
242013 4 8067371 0 0 0 3326 4805 0 0 0 0 0 31878 808957 0 2727 0 8141 6
252013 5 13276100 0 0 0 0 0 0 0 0 0 0 42922 688842 0 6341 7 5 7
262013 6 13948677 0 0 0 0 0 0 0 0 0 0 42439 833282 0 4837 3 14 8
272013 7 3789628 0 0 0 0 0 0 0 0 0 0 55130 748370 0 839 7034 17 9
282013 8 8292060 0 0 0 0 0 0 0 0 0 0 37204 645670 0 12011 2130 11 10
292013 9 4028693 0 0 0 830 492 0 0 0 0 0 38752 687995 0 14690 4372 5052 11
302013 10 5075148 0 0 0 2982 3308 0 0 0 0 0 35374 676644 145 17728 1256 16546 12
312013 11 8359407 0 0 0 3184 2513 0 0 0 0 0 33368 466875 30 4058 43 15943 13
322013 12 6546802 0 0 0 3332 5149 0 0 0 0 0 34104 795749 236 1212 0 25402 14
332014 1 5576195 0 0 0 2593 9404 0 0 0 0 58310 27071 664747 11 674 35 85784 15
342014 2 8170379 0 0 0 3272 6634 0 0 0 0 91027 26425 672357 27729 9 19 147604 16
352014 3 4989090 0 0 0 4477 5534 0 0 1 0 117618 32945 625223 1291 2467 7 150195 17
362014 4 4747388 0 0 0 3364 3515 0 0 0 0 133952 35156 499857 1367 1279 1369 159416 18
372014 5 4263744 0 0 0 3995 4222 0 0 0 0 411027 34794 510866 6335 676 16 444981 19
382014 6 9239076 0 0 0 4600 5372 0 0 0 0 940944 43263 525234 7075 4898 0 987045 20
392014 7 4174522 0 0 0 5615 4094 0 0 0 0 1091168 33562 506274 14826 484 0 1137392 21
402014 8 3908321 0 0 0 3465 4331 0 0 0 0 1516042 37148 615219 12372 5091 0 1554529 22
412014 9 3313688 0 0 0 3590 4935 0 0 0 0 1101364 33585 596388 1297 5138 0 1132529 23
422014 10 3244385 0 0 0 3278 3268 0 0 0 0 1119244 41515 624790 13839 9068 0 1159231 24
432014 11 6345968 0 0 0 3656 3813 0 0 4 0 1370291 34137 541967 5382 3827 0 1398438 25
442014 12 6551805 0 0 0 2134 3200 0 0 0 0 873115 53068 555766 914 20633 2210 896241 26
452015 1 4767293 0 0 0 2592 2958 0 0 2 0 790679 36567 570928 1018 2972 3 810232 27
462015 2 4355602 0 0 0 4432 5294 0 0 2 0 932011 38226 666686 10055 168 0 961464 28
472015 3 3621741 0 0 0 5525 4781 0 0 0 0 838063 29872 695028 30219 378 0 886608 29
482015 4 4906989 0 0 0 3081 3672 0 0 0 0 899655 33464 696535 7582 40992 0 928413 30
492015 5 2495798 0 0 0 5058 5090 0 0 0 0 1667695 25876 635154 99917 11568 4 1787554 31
502015 6 5026410 0 0 0 4180 3915 0 0 2 0 972325 32594 646934 26475 1693 44 1015983 32
512015 7 2376972 0 0 0 3552 3605 0 0 1 0 810760 24182 760103 15854 2819 4 844354 33
522015 8 10669860 0 0 0 3587 3198 0 0 1 0 609604 31661 740370 13832 198 18 647575 34
532015 9 6045863 0 0 0 2765 1999 0 0 8 0 928916 29454 732099 16285 692 46 975421 35
542015 10 4974810 0 0 0 6352 2911 0 0 4 0 710801 29213 708182 43237 79 17 787392 36
552015 11 8715522 0 0 0 7074 3077 0 0 4 0 1525046 47050 785432 86677 1721 5 1687289 37
562015 12 6908196 0 0 0 5563 3165 0 0 5 0 2058710 49665 880370 46501 2373 4728 2185164 38
12016 1 4779455 0 0 0 3875 1913 0 0 3 0 2797426 56703 762277 242888 255 3 3108183 39
22016 2 5065078 693903 0 386412 3197 3491 11033 726 6 0 2345433 44778 901326 109533 1565 613 3638954 40
32016 3 51602331541987 0 748752 2812 1818 25675 1490 5 0 591897 51815 796692 136440 116 35 3176099 41
42016 4 32963481825167 5855 229651 4577 1791 42957 1174 0 0 363488 61778 862344 104171 2347 943 2716075 42
52016 5 6506231 901671 124049 180894 4199 1288 1007 2036 1 0 425712 81582 1055796 227998 151910 0 1995288 43
62016 6 8976199 826479 218334 377555 2644 1479 0 1616 6 0 418789 34802 1106725 131890 97124 32 2094670 44
72016 7 32689901566934 493931 388232 4084 1712 0 462 1 0 181784 29016 969499 130722 10064 16 2841879 45
82016 8 4243115 801790 334437 191945 3470 2048 0 547 1 0 533741 26142 976512 140048 75723 0 2086264 46
92016 9 3664996 969927 553192 35644 3874 1940 0 2417 1 0 544689 53899 958699 214614 15649 0 2444794 47
102016 10 30888331801981 360301 31123 4078 2445 0 5203 1 0 658796 34744 949767 41720 4440 6 2992992 48
112016 11 61307682259076 307356 57237 6030 3249 0 10702 0 0 1084130 39771 1043627 92633 893 0 3909370 49
122016 12 27951401469220 334905 12429 2436 2128 0 6155 5 0 361574 34580 920919 108448 20963 0 2371456 50
132017 1 22118071600324 345783 0 3029 3048 0 3443 3 0 1123873 33846 982559 47119 925 8 3211720 51
142017 2 2826225 794343 244928 0 3062 3964 0 8144 2 0 994879 45774 1117892 252695 10430 0 2385601 52
152017 3 79909822200757 982098 0 6716 3122 0 1560 2 3 495488 52092 1043426 177874 21128 0 3934714 53
162017 4 69264961686582 405861 0 4635 2539 0 2447 3 1 578396 51092 1088496 228599 13173 0 2975217 54
172017 5 2973306 620083 455634 0 3832 2796 0 1828 0 0 374917 41850 1077361 88669 35073 0 1616794 55

In [80]:
# One table per agent type, each with columns V1 (month index), edit (monthly
# count) and group (legend label).
bot_edits <- with(
  revision_agent_types_by_month_ordered_by_year_month,
  data.table(V1 = month_order, edit = bot_edit, group = "Bot")
)
semi_automated_edits <- with(
  revision_agent_types_by_month_ordered_by_year_month,
  data.table(V1 = month_order, edit = semi_automated, group = "Semi-Automated")
)
human_edits <- with(
  revision_agent_types_by_month_ordered_by_year_month,
  data.table(V1 = month_order, edit = human_edit, group = "Human")
)
human_bot_like_edits <- with(
  revision_agent_types_by_month_ordered_by_year_month,
  data.table(V1 = month_order, edit = human_bot_like_edit, group = "bot-like human")
)
anon_edits <- with(
  revision_agent_types_by_month_ordered_by_year_month,
  data.table(V1 = month_order, edit = anon_edit, group = "Anonymous")
)
anon_bot_like_edits <- with(
  revision_agent_types_by_month_ordered_by_year_month,
  data.table(V1 = month_order, edit = anon_bot_like_edit, group = "bot-like anon")
)

# Stack the four main agent types into one long table. The two bot-like
# tables are built above but are currently left out of the combined table.
edits_grouped_by_agent_type <- rbind(
  bot_edits,
  semi_automated_edits,
  human_edits,
  anon_edits
)
setnames(edits_grouped_by_agent_type, c("month_order", "edits", "group"))

head(revision_agent_types_by_month_ordered_by_year_month, n = 60)


yearmonthbot_editquickstatementspetscanautolist2autoeditlabellisteritemcreatordragrefjsrgChnot_flagged_elsewhere_quickstatments_bot_accountother_semi_automated_edit_since_change_taganon_edithuman_edittool_bot_like_edithuman_bot_like_editanon_bot_like_editsemi_automatedmonth_order
192012 11 700 0 0 0 0 0 0 0 0 0 0 517 263987 0 6887 0 0 1
202012 12 183629 0 0 0 18041 8063 0 0 0 0 0 2795 205204 0 673 0 26114 2
212013 1 1932349 0 0 0 19225 4528 0 0 0 0 0 2216 170870 0 15448 0 23754 3
222013 2 2285161 0 0 0 3741 3875 0 0 0 0 0 2073 183928 2 1273 0 7620 4
232013 3 2264112 0 0 0 2574 3411 0 0 0 0 0 8211 347624 0 2023 0 5991 5
242013 4 8067371 0 0 0 3326 4805 0 0 0 0 0 31878 808957 0 2727 0 8141 6
252013 5 13276100 0 0 0 0 0 0 0 0 0 0 42922 688842 0 6341 7 5 7
262013 6 13948677 0 0 0 0 0 0 0 0 0 0 42439 833282 0 4837 3 14 8
272013 7 3789628 0 0 0 0 0 0 0 0 0 0 55130 748370 0 839 7034 17 9
282013 8 8292060 0 0 0 0 0 0 0 0 0 0 37204 645670 0 12011 2130 11 10
292013 9 4028693 0 0 0 830 492 0 0 0 0 0 38752 687995 0 14690 4372 5052 11
302013 10 5075148 0 0 0 2982 3308 0 0 0 0 0 35374 676644 145 17728 1256 16546 12
312013 11 8359407 0 0 0 3184 2513 0 0 0 0 0 33368 466875 30 4058 43 15943 13
322013 12 6546802 0 0 0 3332 5149 0 0 0 0 0 34104 795749 236 1212 0 25402 14
332014 1 5576195 0 0 0 2593 9404 0 0 0 0 58310 27071 664747 11 674 35 85784 15
342014 2 8170379 0 0 0 3272 6634 0 0 0 0 91027 26425 672357 27729 9 19 147604 16
352014 3 4989090 0 0 0 4477 5534 0 0 1 0 117618 32945 625223 1291 2467 7 150195 17
362014 4 4747388 0 0 0 3364 3515 0 0 0 0 133952 35156 499857 1367 1279 1369 159416 18
372014 5 4263744 0 0 0 3995 4222 0 0 0 0 411027 34794 510866 6335 676 16 444981 19
382014 6 9239076 0 0 0 4600 5372 0 0 0 0 940944 43263 525234 7075 4898 0 987045 20
392014 7 4174522 0 0 0 5615 4094 0 0 0 0 1091168 33562 506274 14826 484 0 1137392 21
402014 8 3908321 0 0 0 3465 4331 0 0 0 0 1516042 37148 615219 12372 5091 0 1554529 22
412014 9 3313688 0 0 0 3590 4935 0 0 0 0 1101364 33585 596388 1297 5138 0 1132529 23
422014 10 3244385 0 0 0 3278 3268 0 0 0 0 1119244 41515 624790 13839 9068 0 1159231 24
432014 11 6345968 0 0 0 3656 3813 0 0 4 0 1370291 34137 541967 5382 3827 0 1398438 25
442014 12 6551805 0 0 0 2134 3200 0 0 0 0 873115 53068 555766 914 20633 2210 896241 26
452015 1 4767293 0 0 0 2592 2958 0 0 2 0 790679 36567 570928 1018 2972 3 810232 27
462015 2 4355602 0 0 0 4432 5294 0 0 2 0 932011 38226 666686 10055 168 0 961464 28
472015 3 3621741 0 0 0 5525 4781 0 0 0 0 838063 29872 695028 30219 378 0 886608 29
482015 4 4906989 0 0 0 3081 3672 0 0 0 0 899655 33464 696535 7582 40992 0 928413 30
492015 5 2495798 0 0 0 5058 5090 0 0 0 0 1667695 25876 635154 99917 11568 4 1787554 31
502015 6 5026410 0 0 0 4180 3915 0 0 2 0 972325 32594 646934 26475 1693 44 1015983 32
512015 7 2376972 0 0 0 3552 3605 0 0 1 0 810760 24182 760103 15854 2819 4 844354 33
522015 8 10669860 0 0 0 3587 3198 0 0 1 0 609604 31661 740370 13832 198 18 647575 34
532015 9 6045863 0 0 0 2765 1999 0 0 8 0 928916 29454 732099 16285 692 46 975421 35
542015 10 4974810 0 0 0 6352 2911 0 0 4 0 710801 29213 708182 43237 79 17 787392 36
552015 11 8715522 0 0 0 7074 3077 0 0 4 0 1525046 47050 785432 86677 1721 5 1687289 37
562015 12 6908196 0 0 0 5563 3165 0 0 5 0 2058710 49665 880370 46501 2373 4728 2185164 38
12016 1 4779455 0 0 0 3875 1913 0 0 3 0 2797426 56703 762277 242888 255 3 3108183 39
22016 2 5065078 693903 0 386412 3197 3491 11033 726 6 0 2345433 44778 901326 109533 1565 613 3638954 40
32016 3 51602331541987 0 748752 2812 1818 25675 1490 5 0 591897 51815 796692 136440 116 35 3176099 41
42016 4 32963481825167 5855 229651 4577 1791 42957 1174 0 0 363488 61778 862344 104171 2347 943 2716075 42
52016 5 6506231 901671 124049 180894 4199 1288 1007 2036 1 0 425712 81582 1055796 227998 151910 0 1995288 43
62016 6 8976199 826479 218334 377555 2644 1479 0 1616 6 0 418789 34802 1106725 131890 97124 32 2094670 44
72016 7 32689901566934 493931 388232 4084 1712 0 462 1 0 181784 29016 969499 130722 10064 16 2841879 45
82016 8 4243115 801790 334437 191945 3470 2048 0 547 1 0 533741 26142 976512 140048 75723 0 2086264 46
92016 9 3664996 969927 553192 35644 3874 1940 0 2417 1 0 544689 53899 958699 214614 15649 0 2444794 47
102016 10 30888331801981 360301 31123 4078 2445 0 5203 1 0 658796 34744 949767 41720 4440 6 2992992 48
112016 11 61307682259076 307356 57237 6030 3249 0 10702 0 0 1084130 39771 1043627 92633 893 0 3909370 49
122016 12 27951401469220 334905 12429 2436 2128 0 6155 5 0 361574 34580 920919 108448 20963 0 2371456 50
132017 1 22118071600324 345783 0 3029 3048 0 3443 3 0 1123873 33846 982559 47119 925 8 3211720 51
142017 2 2826225 794343 244928 0 3062 3964 0 8144 2 0 994879 45774 1117892 252695 10430 0 2385601 52
152017 3 79909822200757 982098 0 6716 3122 0 1560 2 3 495488 52092 1043426 177874 21128 0 3934714 53
162017 4 69264961686582 405861 0 4635 2539 0 2447 3 1 578396 51092 1088496 228599 13173 0 2975217 54
172017 5 2973306 620083 455634 0 3832 2796 0 1828 0 0 374917 41850 1077361 88669 35073 0 1616794 55

In [81]:
# Monthly edits per agent type with a linear trend line for each group.
# Ticks sit at month_order 3, 15, 27, 39, 51, the January rows (index 1 is
# November 2012).
ggplot(
  edits_grouped_by_agent_type,
  aes(x = month_order, y = edits, color = group, linetype = group)
) +
  geom_point() +
  geom_line() +
  geom_smooth(method = "lm") +
  labs(title = "Agent Type By Month", x = "Month", y = "Edits") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [70]:
# Same chart restricted to the "Anonymous" group, with its linear trend line.
ggplot(
  subset(edits_grouped_by_agent_type, group == "Anonymous"),
  aes(x = month_order, y = edits, color = group, linetype = group)
) +
  geom_point() +
  geom_line() +
  geom_smooth(method = "lm") +
  labs(title = "Agent Type By Month", x = "Month", y = "Edits") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [ ]:


In [ ]:


In [ ]:


In [ ]:
# Monthly edits per agent type, points joined by lines, without trend lines
# and with default axis labels.
ggplot(
  edits_grouped_by_agent_type,
  aes(x = month_order, y = edits, color = group, linetype = group)
) +
  geom_point() +
  geom_line() +
  labs(title = "Agent Type By Month") +
  scale_color_viridis(discrete = TRUE)

In [35]:
# Read one headerless, tab-separated error-metrics file.
read_error_metrics <- function(path) {
  read.table(path, header = FALSE, sep = "\t")
}

# One table per calendar year, 2012 through 2017.
error_metrics_2012 <- read_error_metrics(
  "../../../results/misalignment_edit_types_tables_and_queries/2012_error_metrics.tsv"
)
error_metrics_2013 <- read_error_metrics(
  "../../../results/misalignment_edit_types_tables_and_queries/2013_error_metrics.tsv"
)
error_metrics_2014 <- read_error_metrics(
  "../../../results/misalignment_edit_types_tables_and_queries/2014_error_metrics.tsv"
)
error_metrics_2015 <- read_error_metrics(
  "../../../results/misalignment_edit_types_tables_and_queries/2015_error_metrics.tsv"
)
error_metrics_2016 <- read_error_metrics(
  "../../../results/misalignment_edit_types_tables_and_queries/2016_error_metrics.tsv"
)
error_metrics_2017 <- read_error_metrics(
  "../../../results/misalignment_edit_types_tables_and_queries/2017_error_metrics.tsv"
)

In [36]:
# The yearly files have no header row; give all six tables the same names.
error_metric_columns <- c(
  "YYYY", "MM", "ME", "MAE", "Median", "Median_Absolute_Error", "MAD",
  "RMSE", "RMSE_WITH_SIGN"
)
names(error_metrics_2012) <- error_metric_columns
names(error_metrics_2013) <- error_metric_columns
names(error_metrics_2014) <- error_metric_columns
names(error_metrics_2015) <- error_metric_columns
names(error_metrics_2016) <- error_metric_columns
names(error_metrics_2017) <- error_metric_columns

In [37]:
# Stack the yearly tables, oldest first, into a single data frame.
error_metrics <- rbind(
  error_metrics_2012,
  error_metrics_2013,
  error_metrics_2014,
  error_metrics_2015,
  error_metrics_2016,
  error_metrics_2017
)

In [38]:
# Sequential month index (1 = first row) used as the x axis of the error
# plots. It is derived from the actual row count rather than a fixed 1:56, so
# the assignment keeps working when the yearly files gain or lose months.
error_metrics$month <- seq_len(nrow(error_metrics))
head(error_metrics, n = 60)


YYYYMMMEMAEMedianMedian_Absolute_ErrorMADRMSERMSE_WITH_SIGNmonth
2012 11 -1.214190e-110.0004613921 0.000000000 0.00000000 0.00000000 0.02507513 -0.003222884 1
2012 12 -4.113368e-090.0182297583 0.000000000 0.00000000 0.00000000 0.14833423 0.021742517 2
2013 1 -1.656790e-060.1295226665 0.000000000 0.00000000 0.00000000 0.37151011 0.038717770 3
2013 2 -3.108226e-050.2151646521 0.000000000 0.00000000 0.00000000 0.47535853 0.006874465 4
2013 3 -6.008570e-050.2648199270 0.000000000 0.00000000 0.00000000 0.52396219 -0.014517413 5
2013 4 -6.744700e-050.3326550593 0.000000000 0.00000000 0.00000000 0.58777596 -0.013591795 6
2013 5 -4.358535e-040.3855384165 0.000000000 0.02256244 0.02256244 0.64643804 -0.050446242 7
2013 6 -4.246231e-040.4313284147 0.000000000 0.05473322 0.05473322 0.69271373 -0.088371543 8
2013 7 -9.161221e-040.4475288346 0.000000000 0.06417301 0.06417301 0.71156448 -0.098673785 9
2013 8 -3.730509e-040.4818761758 0.000000000 0.12789462 0.12789462 0.73712761 -0.098437357 10
2013 9 -3.004899e-040.4953164144 0.000000000 0.15033720 0.15033720 0.74799385 -0.108733099 11
2013 10 -5.304632e-040.5136112598 0.000000000 0.18998062 0.18998062 0.76465586 -0.121336961 12
2013 11 -5.687968e-040.5308135471 0.000000000 0.20867183 0.20867183 0.78318176 -0.117528274 13
2013 12 -1.694638e-030.5473176994 0.000000000 0.26134351 0.26134351 0.80001109 -0.105306938 14
2014 1 -1.726267e-030.5595629381 0.000000000 0.27882139 0.27882139 0.81136077 -0.107519881 15
2014 2 -1.394824e-030.5723376788 0.000000000 0.29964728 0.29964728 0.82223918 -0.109394177 16
2014 3 -1.964296e-030.5833584135 0.000000000 0.31324510 0.31324510 0.83567031 -0.097505674 17
2014 4 -2.394431e-030.6094471068 0.000000000 0.34909777 0.34909777 0.87249836 0.078268641 18
2014 5 -1.384440e-030.5931214968 0.000000000 0.31020822 0.31020822 0.85906070 0.102157567 19
2014 6 -3.324659e-030.5896991495 0.000000000 0.30700902 0.30700902 0.85776494 0.114374404 20
2014 7 -7.087882e-040.5952483821 0.000000000 0.31038416 0.31038416 0.86364972 0.149126064 21
2014 8 -3.098223e-030.6076237993 0.000000000 0.31576891 0.31576891 0.88288227 0.167837567 22
2014 9 -1.442524e-030.6325354826 0.000000000 0.34909777 0.34909777 0.91370328 0.220620404 23
2014 10 -7.347802e-040.6486054150 0.000000000 0.37117346 0.37117346 0.93103541 0.249206712 24
2014 11 -1.776425e-030.6598324896 0.000000000 0.38169978 0.38169978 0.94143988 0.251515571 25
2014 12 -3.125664e-030.6720828256 0.000000000 0.43534295 0.43534295 0.95344862 0.256907022 26
2015 1 -3.554674e-030.6789227478 0.000000000 0.46536441 0.46536441 0.96062842 0.257872655 27
2015 2 -4.282466e-030.6859785941 0.000000000 0.54665289 0.54665289 0.96030690 0.219949376 28
2015 3 -2.807454e-030.7011225949 0.000000000 0.63077363 0.63077363 0.96919503 0.188506297 29
2015 4 -3.815355e-030.7148594639 0.000000000 0.65959565 0.65959565 0.97589280 0.160004968 30
2015 5 -5.726941e-030.7209286992 0.000000000 0.66624177 0.66624177 0.98224734 0.155891595 31
2015 6 -6.199753e-030.7395507740 0.000000000 0.67618352 0.67618352 1.01258409 0.211402526 32
2015 7 -8.162735e-030.7292295945 0.000000000 0.66941169 0.66941169 0.99448087 0.164391087 33
2015 8 -4.415043e-030.7978280524 0.000000000 0.69282655 0.69282655 1.11009313 0.332729736 34
2015 9 -1.217399e-030.8231079988 0.000000000 0.69841090 0.69841090 1.15010563 0.377485602 35
2015 10 -7.932963e-030.8312560351 0.000000000 0.71019017 0.71019017 1.15565399 0.360621528 36
2015 11 -1.233560e-020.8395066310 0.000000000 0.73461052 0.73461052 1.15803013 0.335838493 37
2015 12 -2.046404e-030.8525660610 0.000000000 0.75165364 0.75165364 1.17089763 0.364289702 38
2016 1 -6.533449e-030.8546512658 0.000000000 0.76457882 0.76457882 1.16345887 0.335496988 39
2016 2 -1.132153e-020.8578624269 0.000000000 0.78149368 0.78149368 1.15761022 0.291855294 40
2016 3 -7.819968e-030.8589182857 0.000000000 0.78447766 0.78447766 1.15057136 0.262563336 41
2016 4 -2.784973e-030.8607135865 0.000000000 0.78682511 0.78682511 1.15253299 0.278170666 42
2016 5 -1.923231e-020.8567973420 0.000000000 0.78238761 0.78238761 1.13919807 0.191907752 43
2016 6 -1.259118e-020.8614304415 0.000000000 0.78993325 0.78993325 1.14085331 0.217776901 44
2016 7 -1.924786e-020.8344977294 0.000000000 0.74869199 0.74869199 1.10906585 0.134941610 45
2016 8 -1.069103e-020.7879774111 0.000000000 0.65417246 0.65417246 1.06472479 0.080976401 46
2016 9 -6.508924e-030.7875788159 0.001352363 0.65201094 0.65201113 1.06313687 0.118194949 47
2016 10 -4.528150e-020.7502973623 0.003105619 0.57514691 0.57524289 1.02441171 -0.251557385 48
2016 11 -3.816349e-020.7475307322 0.002924242 0.56879427 0.56809041 1.02287691 -0.231622441 49
2016 12 -3.202052e-020.7440359815 0.003106352 0.55944403 0.55917647 1.01936160 -0.211924468 50
2017 1 -2.862309e-020.7475030164 0.002274990 0.58049667 0.58008351 1.01963670 -0.201467503 51
2017 2 -2.038818e-020.7410495784 0.003195736 0.56676239 0.56651239 1.01246255 -0.152024039 52
2017 3 -1.458780e-020.7518986097 0.006912472 0.60166954 0.60117497 1.01488064 -0.145253290 53
2017 4 -9.733399e-030.7490939362 0.004813967 0.59426448 0.59421278 1.01092655 -0.116357991 54
2017 5 -1.552406e-030.7500804345 0.006592750 0.60889218 0.60943319 1.00791956 -0.085716235 55
2017 6 -1.587324e-030.7528427555 0.006912472 0.61746087 0.61688744 1.00841076 -0.090995863 56

In [39]:
# Mean error (ME) per month. Ticks mark the January rows (index 3, 15, ...).
# No colour aesthetic is mapped, so the viridis colour scale has nothing to
# act on.
ggplot(error_metrics, aes(x = month, y = ME)) +
  geom_point() +
  geom_line() +
  labs(title = "Mean Error Over Time", x = "month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [40]:
# Mean absolute error (MAE) per month. Ticks mark the January rows.
ggplot(error_metrics, aes(x = month, y = MAE)) +
  geom_point() +
  geom_line() +
  labs(title = "Mean Absolute Error Over Time", x = "Month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [41]:
# Root-mean-square error (RMSE) per month. Ticks mark the January rows.
ggplot(error_metrics, aes(x = month, y = RMSE)) +
  geom_point() +
  geom_line() +
  labs(title = "Root-Mean-Square Error Over Time", x = "Month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [42]:
# RMSE_WITH_SIGN column per month. Ticks mark the January rows.
ggplot(error_metrics, aes(x = month, y = RMSE_WITH_SIGN)) +
  geom_point() +
  geom_line() +
  labs(title = "Root Mean Squared Error With Sign Over Time", x = "month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [43]:
# Median column per month. Ticks mark the January rows.
ggplot(error_metrics, aes(x = month, y = Median)) +
  geom_point() +
  geom_line() +
  labs(title = "Median Over Time", x = "month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [44]:
# Median absolute error per month. Ticks mark the January rows.
ggplot(error_metrics, aes(x = month, y = Median_Absolute_Error)) +
  geom_point() +
  geom_line() +
  labs(title = "Median Absolute Error Over Time", x = "month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [45]:
# Median absolute deviation (MAD) per month. Ticks mark the January rows.
ggplot(error_metrics, aes(x = month, y = MAD)) +
  geom_point() +
  geom_line() +
  labs(title = "Median Absolute Deviation Over Time", x = "Month") +
  scale_x_continuous(
    breaks = seq(3, 51, by = 12),
    labels = c("Jan 2013", "Jan 2014", "Jan 2015", "Jan 2016", "Jan 2017")
  ) +
  scale_color_viridis(discrete = TRUE)



In [46]:
# Print min / quartiles / mean / max for every column of the combined
# error-metrics table, including the derived month index.
summary(error_metrics)


      YYYY            MM               ME                  MAE           
 Min.   :2012   Min.   : 1.000   Min.   :-0.0452815   Min.   :0.0004614  
 1st Qu.:2014   1st Qu.: 3.000   1st Qu.:-0.0079904   1st Qu.:0.5565016  
 Median :2015   Median : 6.000   Median :-0.0027962   Median :0.6935506  
 Mean   :2015   Mean   : 6.357   Mean   :-0.0067794   Mean   :0.6344153  
 3rd Qu.:2016   3rd Qu.: 9.250   3rd Qu.:-0.0008708   3rd Qu.:0.7615268  
 Max.   :2017   Max.   :12.000   Max.   : 0.0000000   Max.   :0.8614304  
     Median          Median_Absolute_Error      MAD              RMSE        
 Min.   :0.0000000   Min.   :0.0000        Min.   :0.0000   Min.   :0.02508  
 1st Qu.:0.0000000   1st Qu.:0.2745        1st Qu.:0.2745   1st Qu.:0.80852  
 Median :0.0000000   Median :0.5530        Median :0.5529   Median :0.96491  
 Mean   :0.0007356   Mean   :0.4468        Mean   :0.4468   Mean   :0.90076  
 3rd Qu.:0.0000000   3rd Qu.:0.6670        3rd Qu.:0.6670   3rd Qu.:1.03409  
 Max.   :0.0069125   Max.   :0.7899        Max.   :0.7899   Max.   :1.17090  
 RMSE_WITH_SIGN         month      
 Min.   :-0.25156   Min.   : 1.00  
 1st Qu.:-0.09850   1st Qu.:14.75  
 Median : 0.09157   Median :28.50  
 Mean   : 0.07280   Mean   :28.50  
 3rd Qu.: 0.22012   3rd Qu.:42.25  
 Max.   : 0.37749   Max.   :56.00  

In [ ]:


In [ ]: