Last active
October 29, 2015 19:49
-
-
Save rspeer/4c90067d8570eff43208 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
>>> import wordfreq, langcodes | |
>>> def legible_list(lst): | |
... return('\N{LEFT-TO-RIGHT MARK}, '.join(lst)) | |
... | |
>>> for lang in sorted(wordfreq.available_languages()): | |
... language_name = langcodes.get(lang).language_name('en') | |
... top_ten = legible_list(wordfreq.top_n_list(lang, 10)) | |
... print('%-3s %-12s %s' % (lang, language_name, top_ten)) | |
... | |
ar Arabic في, من, على, لا, أن, rt, و, ما, هذا, إلى | |
de German die, der, und, ich, in, das, ist, sie, nicht, von | |
el Greek και, το, να, του, η, την, με, τησ, είναι, ο | |
en English the, of, to, and, in, a, i, you, it, is | |
es Spanish de, la, que, el, en, y, a, no, los, es | |
fr French de, la, le, et, est, à, les, en, je, un | |
id Indonesian yang, dan, di, ini, rt, dari, untuk, adalah, itu, dengan | |
it Italian di, e, che, il, la, a, non, in, un, è | |
ja Japanese の, に, は, て, た, が, を, で, と, し | |
ko Korean rt, ♥, 있다, 이, 수, 그, 있는, 아, 는, ♡ | |
ms Malay yang, aku, di, dan, rt, tidak, ini, kau, itu, untuk | |
nl Dutch de, ik, je, het, een, is, van, en, in, dat | |
pl Polish w, nie, i, się, na, to, z, rt, do, jest | |
pt Portuguese de, a, o, que, e, não, é, do, da, em | |
ru Russian в, и, не, я, на, что, с, это, как, а | |
sv Swedish är, i, jag, och, det, att, en, på, som, du | |
tr Turkish bir, ve, rt, bu, ne, de, için, çok, da, ben | |
zh Chinese 的, 我, 了, 是, 你, 在, 不, 他, 一, 这 |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment