Last active
May 12, 2016 09:03
-
-
Save sirex/d65113958a062586c1d484921648057d to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"cells": [ | |
{ | |
"cell_type": "code", | |
"execution_count": 1, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"import datapackage" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 2, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"storage = datapackage.push_datapackage('http://data.okfn.org/data/core/country-list/datapackage.json', 'pandas')" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 3, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"['data___data']" | |
] | |
}, | |
"execution_count": 3, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"storage.tables" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 4, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"pandas.core.frame.DataFrame" | |
] | |
}, | |
"execution_count": 4, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"type(storage['data___data'])" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 5, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>Name</th>\n", | |
" <th>Code</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>0</th>\n", | |
" <td>Afghanistan</td>\n", | |
" <td>AF</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1</th>\n", | |
" <td>Åland Islands</td>\n", | |
" <td>AX</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2</th>\n", | |
" <td>Albania</td>\n", | |
" <td>AL</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>3</th>\n", | |
" <td>Algeria</td>\n", | |
" <td>DZ</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4</th>\n", | |
" <td>American Samoa</td>\n", | |
" <td>AS</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" Name Code\n", | |
"0 Afghanistan AF\n", | |
"1 Åland Islands AX\n", | |
"2 Albania AL\n", | |
"3 Algeria DZ\n", | |
"4 American Samoa AS" | |
] | |
}, | |
"execution_count": 5, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"storage['data___data'].head()" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 6, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"datapackage.pull_datapackage('/tmp/test/datapackage.json', 'country_list', 'pandas', tables={\n", | |
" 'data': storage['data___data'],\n", | |
"})" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 7, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"name": "stdout", | |
"output_type": "stream", | |
"text": [ | |
"{\r\n", | |
" \"name\": \"country_list\",\r\n", | |
" \"resources\": [\r\n", | |
" {\r\n", | |
" \"schema\": {\r\n", | |
" \"fields\": [\r\n", | |
" {\r\n", | |
" \"name\": \"Name\",\r\n", | |
" \"type\": \"string\",\r\n", | |
" \"constraints\": {\r\n", | |
" \"required\": true\r\n", | |
" }\r\n", | |
" },\r\n", | |
" {\r\n", | |
" \"name\": \"Code\",\r\n", | |
" \"type\": \"string\",\r\n", | |
" \"constraints\": {\r\n", | |
" \"required\": true\r\n", | |
" }\r\n", | |
" }\r\n", | |
" ]\r\n", | |
" },\r\n", | |
" \"path\": \"data.csv\"\r\n", | |
" }\r\n", | |
" ]\r\n", | |
"}" | |
] | |
} | |
], | |
"source": [ | |
"!cat /tmp/test/datapackage.json" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 8, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"name": "stdout", | |
"output_type": "stream", | |
"text": [ | |
"Name,Code\r", | |
"\r\n", | |
"Afghanistan,AF\r", | |
"\r\n", | |
"Åland Islands,AX\r", | |
"\r\n", | |
"Albania,AL\r", | |
"\r\n", | |
"Algeria,DZ\r", | |
"\r\n", | |
"American Samoa,AS\r", | |
"\r\n", | |
"Andorra,AD\r", | |
"\r\n", | |
"Angola,AO\r", | |
"\r\n", | |
"Anguilla,AI\r", | |
"\r\n", | |
"Antarctica,AQ\r", | |
"\r\n" | |
] | |
} | |
], | |
"source": [ | |
"!head /tmp/test/data.csv" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 9, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [ | |
"storage = datapackage.push_datapackage('http://data.okfn.org/data/core/country-codes/datapackage.json', 'pandas')" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 10, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"['data__country_codes___country_codes']" | |
] | |
}, | |
"execution_count": 10, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"storage.tables" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 11, | |
"metadata": { | |
"collapsed": false | |
}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>0</th>\n", | |
" <th>1</th>\n", | |
" <th>2</th>\n", | |
" <th>3</th>\n", | |
" <th>4</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>name</th>\n", | |
" <td>Afghanistan</td>\n", | |
" <td>Albania</td>\n", | |
" <td>Algeria</td>\n", | |
" <td>American Samoa</td>\n", | |
" <td>Andorra</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>name_fr</th>\n", | |
" <td>Afghanistan</td>\n", | |
" <td>Albanie</td>\n", | |
" <td>Algérie</td>\n", | |
" <td>Samoa Américaines</td>\n", | |
" <td>Andorre</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>ISO3166-1-Alpha-2</th>\n", | |
" <td>AF</td>\n", | |
" <td>AL</td>\n", | |
" <td>DZ</td>\n", | |
" <td>AS</td>\n", | |
" <td>AD</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>ISO3166-1-Alpha-3</th>\n", | |
" <td>AFG</td>\n", | |
" <td>ALB</td>\n", | |
" <td>DZA</td>\n", | |
" <td>ASM</td>\n", | |
" <td>AND</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>ISO3166-1-numeric</th>\n", | |
" <td>4</td>\n", | |
" <td>8</td>\n", | |
" <td>12</td>\n", | |
" <td>16</td>\n", | |
" <td>20</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>ITU</th>\n", | |
" <td>AFG</td>\n", | |
" <td>ALB</td>\n", | |
" <td>ALG</td>\n", | |
" <td>SMA</td>\n", | |
" <td>AND</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>MARC</th>\n", | |
" <td>af</td>\n", | |
" <td>aa</td>\n", | |
" <td>ae</td>\n", | |
" <td>as</td>\n", | |
" <td>an</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>WMO</th>\n", | |
" <td>AF</td>\n", | |
" <td>AB</td>\n", | |
" <td>AL</td>\n", | |
" <td></td>\n", | |
" <td></td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>DS</th>\n", | |
" <td>AFG</td>\n", | |
" <td>AL</td>\n", | |
" <td>DZ</td>\n", | |
" <td>USA</td>\n", | |
" <td>AND</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>Dial</th>\n", | |
" <td>93</td>\n", | |
" <td>355</td>\n", | |
" <td>213</td>\n", | |
" <td>1-684</td>\n", | |
" <td>376</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>FIFA</th>\n", | |
" <td>AFG</td>\n", | |
" <td>ALB</td>\n", | |
" <td>ALG</td>\n", | |
" <td>ASA</td>\n", | |
" <td>AND</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>FIPS</th>\n", | |
" <td>AF</td>\n", | |
" <td>AL</td>\n", | |
" <td>AG</td>\n", | |
" <td>AQ</td>\n", | |
" <td>AN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>GAUL</th>\n", | |
" <td>1</td>\n", | |
" <td>3</td>\n", | |
" <td>4</td>\n", | |
" <td>5</td>\n", | |
" <td>7</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>IOC</th>\n", | |
" <td>AFG</td>\n", | |
" <td>ALB</td>\n", | |
" <td>ALG</td>\n", | |
" <td>ASA</td>\n", | |
" <td>AND</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>currency_alphabetic_code</th>\n", | |
" <td>AFN</td>\n", | |
" <td>ALL</td>\n", | |
" <td>DZD</td>\n", | |
" <td>USD</td>\n", | |
" <td>EUR</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>currency_country_name</th>\n", | |
" <td>AFGHANISTAN</td>\n", | |
" <td>ALBANIA</td>\n", | |
" <td>ALGERIA</td>\n", | |
" <td>AMERICAN SAMOA</td>\n", | |
" <td>ANDORRA</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>currency_minor_unit</th>\n", | |
" <td>2</td>\n", | |
" <td>2</td>\n", | |
" <td>2</td>\n", | |
" <td>2</td>\n", | |
" <td>2</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>currency_name</th>\n", | |
" <td>Afghani</td>\n", | |
" <td>Lek</td>\n", | |
" <td>Algerian Dinar</td>\n", | |
" <td>US Dollar</td>\n", | |
" <td>Euro</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>currency_numeric_code</th>\n", | |
" <td>971</td>\n", | |
" <td>8</td>\n", | |
" <td>12</td>\n", | |
" <td>840</td>\n", | |
" <td>978</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>is_independent</th>\n", | |
" <td>Yes</td>\n", | |
" <td>Yes</td>\n", | |
" <td>Yes</td>\n", | |
" <td>Territory of US</td>\n", | |
" <td>Yes</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" 0 1 2 \\\n", | |
"name Afghanistan Albania Algeria \n", | |
"name_fr Afghanistan Albanie Algérie \n", | |
"ISO3166-1-Alpha-2 AF AL DZ \n", | |
"ISO3166-1-Alpha-3 AFG ALB DZA \n", | |
"ISO3166-1-numeric 4 8 12 \n", | |
"ITU AFG ALB ALG \n", | |
"MARC af aa ae \n", | |
"WMO AF AB AL \n", | |
"DS AFG AL DZ \n", | |
"Dial 93 355 213 \n", | |
"FIFA AFG ALB ALG \n", | |
"FIPS AF AL AG \n", | |
"GAUL 1 3 4 \n", | |
"IOC AFG ALB ALG \n", | |
"currency_alphabetic_code AFN ALL DZD \n", | |
"currency_country_name AFGHANISTAN ALBANIA ALGERIA \n", | |
"currency_minor_unit 2 2 2 \n", | |
"currency_name Afghani Lek Algerian Dinar \n", | |
"currency_numeric_code 971 8 12 \n", | |
"is_independent Yes Yes Yes \n", | |
"\n", | |
" 3 4 \n", | |
"name American Samoa Andorra \n", | |
"name_fr Samoa Américaines Andorre \n", | |
"ISO3166-1-Alpha-2 AS AD \n", | |
"ISO3166-1-Alpha-3 ASM AND \n", | |
"ISO3166-1-numeric 16 20 \n", | |
"ITU SMA AND \n", | |
"MARC as an \n", | |
"WMO \n", | |
"DS USA AND \n", | |
"Dial 1-684 376 \n", | |
"FIFA ASA AND \n", | |
"FIPS AQ AN \n", | |
"GAUL 5 7 \n", | |
"IOC ASA AND \n", | |
"currency_alphabetic_code USD EUR \n", | |
"currency_country_name AMERICAN SAMOA ANDORRA \n", | |
"currency_minor_unit 2 2 \n", | |
"currency_name US Dollar Euro \n", | |
"currency_numeric_code 840 978 \n", | |
"is_independent Territory of US Yes " | |
] | |
}, | |
"execution_count": 11, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"storage['data__country_codes___country_codes'].head().T" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": null, | |
"metadata": { | |
"collapsed": true | |
}, | |
"outputs": [], | |
"source": [] | |
} | |
], | |
"metadata": { | |
"kernelspec": { | |
"display_name": "Python 3", | |
"language": "python", | |
"name": "python3" | |
}, | |
"language_info": { | |
"codemirror_mode": { | |
"name": "ipython", | |
"version": 3 | |
}, | |
"file_extension": ".py", | |
"mimetype": "text/x-python", | |
"name": "python", | |
"nbconvert_exporter": "python", | |
"pygments_lexer": "ipython3", | |
"version": "3.4.3" | |
} | |
}, | |
"nbformat": 4, | |
"nbformat_minor": 0 | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment