Skip to content

Instantly share code, notes, and snippets.

["__cs", "__dx", "__d4", "__gv", "__oq", "__ov", "__qc", "__qy", "__uw", "__vt", "__vu", "__v5", "__xj", "__xv", "__yw", "__y3", "__1r", "__1u", "__2e", "__2j", "__2v", "__3j", "__3p", "__3q", "__3r", "__4h", "__4q", "__4t", "__4v", "__4w", "__4y", "__5c", "__5e", "__5i", "__5p", "__5q", "__5r", "__5t", "__5u", "__5v", "__5w", "__5y", "__6g", "__7r", "__8k", "__8l", "__8q", "__9j", "__9p", "_acq", "_ac0", "_ae0", "_ae2", "_ae9", "_agl", "_ag0", "_ahv", "_ahx", "_ahy", "_ah9", "_aj8", "_ak8", "_al6", "_am6", "_an5", "_an8", "_apq", "_ap0", "_aqg", "_aqj", "_aq4", "_aq7", "_aq9", "_as8", "_at5", "_auw", "_au0", "_au2", "_au5", "_au6", "_au9", "_avj", "_avq", "_avx", "_av1", "_av2", "_av5", "_av6", "_av8", "_aw8", "_aw9", "_axb", "_axf", "_axj", "_axq", "_axw", "_ay2", "_ay4", "_ay6", "_a0e", "_a0f", "_a0k", "_a0l", "_a0m", "_a0u", "_a0w", "_a1l", "_a1n", "_a1p", "_a1u", "_a1w", "_a2d", "_a2e", "_a2f", "_a2j", "_a2o", "_a2q", "_a3c", "_a3e", "_a3f", "_a3h", "_a3u", "_a3x", "_a3y", "_a4b", "_a4f", "_a4g", "_a4h",
feature name description
ah_actions number of actions included in Template:Article History on the article
ah_article_history the full content of Template:Article History
ah_assessment_average the average quality assessment by all of the wikiprojects that assessed this article
ah_assessment_count total number of quality assessments by all of the projects for this article
ah_assessment_list list of all the assessments by all of the wikiprojects for this article
ah_current the current assessment according to Template:Article History
ah_latest_action_age time since the latest assessment action was taken according to Template:Article History
ah_oldest_action_age time since the first assessment action was taken on this article
@slaporte
slaporte / FAs.md
Last active January 23, 2018 02:42
cat_contains_1800 cat_contains_19th_century cat_contains_history infobox_contains_1800 intro_p_contains_1800 title total_history_freq
2 1 0 False True Golding Bird 0.000487995315245
1 0 2 False False Pedro Álvares Cabral 0.00181268882175
1 0 0 True True Princess Alice of Battenberg 0.000224719101124
1 0 0 True True Stan Coveleski 0.00139508928571
0 0 0 False False Bryan Gunn 0.000414651002073
1 0 0 False True Guy Bradley 0.000303398058252
0 0 0 False False Audioslave 0.000673945275644
0 0 0 False False James Robert Baker 0.00108932461874
# -*- coding: utf-8 -*-
IRREGULAR_PLURALS = {'alumnus': 'alumni',
'cactus': 'cacti',
'focus': 'foci',
'fungus': 'fungi',
'nucleus': 'nuclei',
'radius': 'radii',
'stimulus': 'stimuli',
'axis': 'axes',
This file has been truncated, but you can view the full file.
title id ah_current ah_assessment_average word_count cite_count cite_journal cite_book cite_web
Hardie Gramatky 5009744 NO B 733 5 0 0 1
Harry Crosby 179529 NO B 4791 37 0 8 22
Dallin H. Oaks 183662 NO B 1842 27 0 0 6
Charles Groves Wright Anderson 826250 NO B 1469 13 0 2 7
Raid at Combahee Ferry 9350667 NO B 2158 12 0 0 0
Luther Alexander Gotwald 18199681 NO B 9822 85 0 1 0
Virginia State University 586866 NO B 2266 31 0 0 31
Battle of the Ch'ongch'on River 25558340 GA GA 8473 234 0 0 2
Bothell, Washington 151275 NO B 2258 36 0 0 11
@slaporte
slaporte / stat_lists.py
Created November 18, 2012 07:46
qualityvis stat lists
structure = [
'd_fr_sect_count',
'd_has_ext_link_sect',
'd_has_notes_sect',
'd_has_ref_sect',
'd_ext_link_sect_li_count',
'd_thumb_left_count',
'd_thumb_right_count',
'd_int_link_text_count',
media_attrs = ['d_all_img_count',
'd_geo_count',
'd_image_map_count',
'd_ipa_count',
'd_midi_count',
'd_ogg_count',
'd_pdf_count',
'd_spoken_wp_count',
'd_svg_count',
[('w_per_d_int_link_text_mean', (6.0, 99.999999999999986, 100.0)), ('w_per_d_spoken_wp_count', (5.0, 22.577742708935169, 23.770124639507372)), ('w_per_d_h2_text_rel_std_dev', (4.0, 14.471598650263878, 15.482189959570947)), ('w_per_d_caption_word_mean_trimmed', (3.0, 5.7619132808119673, 6.6283144220189563))]
[('d_word_count', (6.0, 100.0, 99.999999999999986)), ('d_thumb_right_count', (5.0, 22.179757861855681, 23.332685527701166)), ('d_spoken_wp_count', (4.0, 13.471589052699164, 14.463359298026649)), ('d_h2_text_rel_std_dev', (3.0, 7.1381725095355932, 7.9374177678378803))]
[('d_word_count', (14.0, 100.0, 100.0)), ('d_thumb_right_count', (13.0, 31.302728818298792, 33.166031248246895)), ('d_spoken_wp_count', (12.0, 23.571797752505049, 25.434284334151592)), ('d_h2_text_rel_std_dev', (11.0, 17.937711328380029, 19.745359721277694)), ('d_p_median', (10.0, 12.91909193432876, 14.663181514100341)), ('d_has_notes_sect', (9.0, 10.486430177615439, 12.083929495472743)), ('d_cite_journal', (8.0, 8.1500972384260066, 9.60310
== Learner results ==
CA Sens Spec AUC IS F1 Prec Recall Brier MCC
d_Earth 0.7581 0.7806 0.7352 0.8354 0.3776 0.7646 0.7493 0.7806 0.3384 0.5164
d_CN2 0.7244 0.8544 0.5925 0.7783 0.1917 0.7574 0.6801 0.8544 0.4005 0.4635
rv_wo_Earth 0.7452 0.8220 0.6674 0.8179 0.3347 0.7646 0.7147 0.8220 0.3821 0.4955
rv_all_Earth 0.7330 0.7368 0.7290 0.8215 0.3455 0.7353 0.7338 0.7368 0.3464 0.4659
rv_all_CN2 0.7389 0.8893 0.5863 0.8013 0.2613 0.7742 0.6855 0.8893 0.3669 0.4996
rv_t_Earth 0.6711 0.6638 0.6785 0.7191 0.1729 0.6702 0.6767 0.6638 0.4307 0.3423
links_Earth 0.6321 0.6610 0.6028 0.6837 0.1221 0.6440 0.6279 0.6610 0.4505 0.2643