This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/awk -f | |
BEGIN { | |
# significance level | |
if (length(ALPHA) == 0) ALPHA = 0.05; | |
# standard error estimation method: "basic" or "pooled" | |
if (length(SE) == 0) SE = "basic"; | |
# one-tailed or two-tailed? | |
if (TAILS != 2) TAILS = 1; |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python | |
# This script computes the normalized modified purity and inverse purity | |
# as described in this paper: https://aclweb.org/anthology/P14-1097. | |
# In fact, this program is currently quite a rough translation of | |
# the evaluation-verb-classes.perl script provided by Daisuke Kawahara. | |
import argparse | |
import re | |
import sys |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
LC_COLLATE = C | |
SEED = 1337 | |
WCL_WRAPPER = /srv/definitions/wcl-extract | |
measure: | |
./measure.py | |
kfold: wiki_really_all.txt | |
./kfold.py --seed=$(SEED) $< |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env groovy | |
import org.apache.commons.math3.stat.descriptive.moment.Mean | |
import org.apache.commons.math3.stat.descriptive.moment.StandardDeviation | |
import org.jgrapht.graph.SimpleWeightedGraph | |
import org.jgrapht.util.SupplierUtil | |
import org.nlpub.watset.graph.ChineseWhispers | |
import org.nlpub.watset.graph.NodeWeighting | |
import org.nlpub.watset.graph.MaxMax | |
import org.nlpub.watset.eval.Measurer | |
import org.nlpub.watset.graph.Watset |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python3 | |
__author__ = 'Dmitry Ustalov' | |
__credits__ = 'Sebastian Padó' | |
__license__ = 'MIT' | |
# This is an MIT-licensed implementation of the sigf toolkit for randomization tests: | |
# https://nlpado.de/~sebastian/software/sigf.shtml | |
import random |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
WATSET ?= ../watset-java/target/watset.jar | |
LCC ?= ../lcc | |
export LANG:=en_US.UTF-8 | |
export LC_COLLATE:=C | |
export CLASSPATH := $(WATSET) | |
nodes: | |
cut -f1,2 $(LCC)/eng_news_2016_10K/eng_news_2016_10K-co_s.txt | sed -re 's/\t/\n/g' | sort -u | wc -l | |
cut -f1,2 $(LCC)/eng_news_2016_30K/eng_news_2016_30K-co_s.txt | sed -re 's/\t/\n/g' | sort -u | wc -l |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/bin/sh -eu | |
CWD=$(basename "$PWD") | |
XZ_OPT="-T 0" exec tar --exclude '*~' -C ../ -cJvf "../$CWD.tar.xz" "$CWD" |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/usr/bin/env python3 | |
""" | |
An implementation of the Bradley-Terry ranking aggregation algorithm from the paper | |
MM algorithms for generalized Bradley-Terry models | |
<https://doi.org/10.1214/aos/1079120141>. | |
""" | |
__author__ = 'Dmitry Ustalov' | |
__copyright__ = 'Copyright 2021 Dmitry Ustalov' |
OlderNewer