Last active
November 7, 2019 09:42
-
-
Save rwst/7adf285a98521ed06bbf271b1cc55eb0 to your computer and use it in GitHub Desktop.
Produces QuickStatements (QS) commands to move all sitelinks from a list of Wikidata (WD) items to their corresponding items.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import csv | |
from sys import * | |
def _load_sitelinks(path):
    """Group the rows of a tab-separated sitelink export by item.

    The file must have a header row; the columns read are ``p`` (an item
    URL -- presumably a Wikidata entity URI, verify against the query that
    produced the export), ``lang`` and ``lemma``.

    Returns a dict mapping the item id (the text after the last ``/`` of
    ``p``) to a ``{lang: lemma}`` dict.  When the same item/lang pair
    occurs more than once, the last row wins.

    Raises ``OSError`` if the file cannot be opened and ``AttributeError``
    if a row has no ``p`` value.
    """
    sitelinks = {}
    # newline='' lets the csv module do its own line-ending handling, and
    # the with-block closes the handle instead of leaking it.
    with open(path, 'r', newline='') as tab_file:
        for row in csv.DictReader(tab_file, delimiter='\t'):
            item_url = row.get('p')
            item_id = item_url[item_url.rfind('/') + 1:]
            sitelinks.setdefault(item_id, {})[row.get('lang')] = row.get('lemma')
    return sitelinks


# item id -> {lang: lemma}, read from the gene export.
gqs = _load_sitelinks('genes-wikipedia.tab')
# item id -> {lang: lemma}, read from the protein export.
pqs = _load_sitelinks('proteins-wikipedia.tab')
# First pass over t.tab: find the ids in column ``g`` that occur on more
# than one row.
its = set()   # every ``g`` id seen so far
dits = set()  # ``g`` ids seen at least twice
# The with-block closes the file once the pass is done; newline='' is what
# the csv module expects of the file objects it is handed.
with open('t.tab', 'r', newline='') as mapping_file:
    reader = csv.DictReader(mapping_file, delimiter='\t')
    for item in reader:
        iturl = item.get('g')
        # Keep only the id, i.e. the text after the last '/' of the URL.
        git = iturl[iturl.rfind('/') + 1:]
        if git in its:
            dits.add(git)
        else:
            its.add(git)
# Second pass over t.tab: for every row whose ``g`` id is not a duplicate,
# print commands that take each sitelink off the ``g`` item and put it on
# the ``p`` item, for the languages where the ``p`` item has no sitelink.
# The with-block closes the file when the pass ends; newline='' is what the
# csv module expects of the file objects it is handed.
with open('t.tab', 'r', newline='') as mapping_file:
    reader = csv.DictReader(mapping_file, delimiter='\t')
    for item in reader:
        iturl = item.get('g')
        git = iturl[iturl.rfind('/') + 1:]
        if git in dits:
            # A ``g`` id listed on several rows has no single target: skip.
            continue
        iturl = item.get('p')
        pit = iturl[iturl.rfind('/') + 1:]
        g = gqs.get(git)
        if g is None:
            # No sitelinks recorded for this ``g`` item: nothing to move.
            continue
        # Treat a ``p`` item without recorded sitelinks as having none.
        p = pqs.get(pit, {})
        links = [
            (lang, lemma)
            for lang, lemma in g.items()
            if p.get(lang) is None
        ]
        # Emit every removal before any addition for this pair of items.
        for lang, _lemma in links:
            print('-{}|S{}wiki|""'.format(git, lang))
        for lang, lemma in links:
            print('{}|S{}wiki|"{}"'.format(pit, lang, lemma))
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment