Skip to content

Instantly share code, notes, and snippets.

# Per-user Git defaults; every setting is written to the global (~/.gitconfig) scope.

# Set color output to "auto" for diff, status, branch and grep.
git config --global color.diff auto
git config --global color.status auto
git config --global color.branch auto
git config --global color.grep auto

# Point Git at a per-user ignore file. The path is quoted so that a home
# directory containing whitespace is still passed as a single argument.
git config --global core.excludesfile "$HOME/.gitignore"

# Select the "patience" diff algorithm.
git config --global diff.algorithm patience

# Set the default push behaviour to "current".
git config --global push.default current

# Alias: `git st` runs `git status`.
git config --global alias.st status
@mrorii
mrorii / build.gradle
Last active August 29, 2015 14:02
logback + logstash
// Pulls in the Logstash encoder for Logback, declared with the compact
// "group:name:version" coordinate string instead of the map notation.
dependencies {
    compile 'net.logstash.logback:logstash-logback-encoder:2.8'
}
{"website": "http://quora.com", "industries": "Internet", "name": "Quora", "company_type": "Privately Held", "universal_name": "quora", "specialties": [], "location": {"country": "United States", "region": "CA", "postal_code": "94041", "street_address": "650 Castro Street", "locality": "Mountain View,"}, "employee_count": "51-200 employees", "founded_year": ""}
{"website": "http://www.dropbox.com", "industries": "Internet", "name": "Dropbox", "company_type": "Privately Held", "universal_name": "dropbox", "specialties": ["cross-platform file sync", "file sharing", "online backup", "cloud storage"], "location": {}, "employee_count": "201-500 employees", "founded_year": "2007"}
{"website": "http://www.facebook.com/", "industries": "Internet", "name": "Facebook", "company_type": "Public Company", "universal_name": "facebook", "specialties": [], "location": {"country": "United States", "region": "CA", "postal_code": "94025", "street_address": "1 Hacker Way", "locality": "Menlo Park,"}, "employee_count": "5001-10,0
orii[10605]$ python -m cdec.sa.extract -c cpad/extract.ini -g cpad/dev.grammars -z < cpad/cookpad.dev.ja-en > cpad/cookpad.dev.ja-en.sgm
INFO:cdec.sa:Sampling strategy: uniform, max sample size = 300
INFO:cdec.sa:Reading precomputed data from file /home/orii/cdec/cpad/training.sa/precomp.5.2.15.1.100.10.bin...
INFO:cdec.sa:Converting 42 hash keys on precomputed inverted index...
INFO:cdec.sa:Converting 7564 hash keys on precomputed collocations...
INFO:cdec.sa:Processing precomputations took 0.084005 seconds
Traceback (most recent call last):
File "/home/orii/Canopy/appdata/canopy-1.0.3.1262.rh5-x86/lib/python2.7/runpy.py", line 162, in _run_module_as_main
"__main__", fname, loader, pkg_name)
File "/home/orii/Canopy/appdata/canopy-1.0.3.1262.rh5-x86/lib/python2.7/runpy.py", line 72, in _run_code
@mrorii
mrorii / check_cookpad_en.py
Last active December 21, 2015 11:59
Check number of recipes on https://en.cookpad.com/
#!/usr/bin/env python
import os
import time
import urlparse
import requests
from scrapy.selector import HtmlXPathSelector
def get_count(url):
#!/usr/bin/env python
import gzip
try:
import cStringIO as StringIO
except:
import StringIO
# ...
package hw8;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.conf.Configured;
import org.apache.hadoop.filecache.DistributedCache;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.mapreduce.Job;
-- Recreate the `user` table from scratch (any existing table and its rows are dropped).
DROP TABLE IF EXISTS user;
CREATE TABLE user (
  -- Surrogate key, assigned by the server.
  id int NOT NULL auto_increment,
  name varchar(100) NOT NULL default '',
  -- Defaults to the time the row is inserted.
  registerDate timestamp NOT NULL default CURRENT_TIMESTAMP,
  -- GROUP is a reserved word in MySQL, so the column name must be
  -- backtick-quoted; unquoted it is a syntax error.
  `group` int NOT NULL default '0',
  PRIMARY KEY (id)
) ENGINE=InnoDB DEFAULT CHARSET=utf8;
DROP TABLE IF EXISTS decoration_binary;
<?xml version="1.0" encoding="utf-8"?>
<xmi:XMI xmlns:bio="http:///edu/cmu/lti/bio.ecore"
xmlns:cas="http:///uima/cas.ecore"
xmlns:oaqa="http:///edu/cmu/lti/oaqa.ecore"
xmlns:xmi="http://www.omg.org/XMI"
xmlns:trec="http:///edu/cmu/lti/bio/trec.ecore"
xmlns:model="http:///org/oaqa/model.ecore"
xmlns:ie="http:///edu/cmu/lti/bio/ie.ecore"
xmlns:types="http:///edu/cmu/lti/oaqa/framework/types.ecore"
xmlns:tcas="http:///uima/tcas.ecore"
@mrorii
mrorii / output
Created January 17, 2013 04:23
Simple script for checking whether estimators call check_arrays in fit
Estimator Calls check_arrays?
RandomForestClassifier True
RBFSampler False
LDA True
GaussianNB True
LinearSVC False
SVC False