Find the Wikipedia article for a given term via DBpedia. An example call is at the bottom.
from bs4 import BeautifulSoup, NavigableString, Tag
from urllib2 import urlopen
import json

def check_dbpedia(term):
    """Query the DBpedia lookup service and return matching resource URIs."""
    api = 'http://lookup.dbpedia.org/api/search.asmx/KeywordSearch?MaxHits=10&QueryString='
    #api = 'http://lookup.dbpedia.org/api/search.asmx/PrefixSearch?MaxHits=10&QueryString='
    response = urlopen(api + term)
    soup = BeautifulSoup(response.read())

    # Collect (label, uri) pairs from the XML results
    urls = []
    for result in soup.findAll('result'):
        for child in result.children:
            if isinstance(child, Tag):
                if child.name == 'label':
                    current_label = child.string
                if child.name == 'uri':
                    urls.append({'label': current_label, 'url': child.string})
    #print urls

    ## exact match: return the single result whose label equals the term
    found = ""
    for url in urls:
        if url['label'] == term:
            url['match'] = 'exact'
            found = url

    ## no exact match: return up to three partial matches
    if found == "":
        found = urls[0:3]
        for url in found:
            url['match'] = 'partial'

    return found
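One caveat not addressed in the gist: the term is appended to the query string unescaped, so a multi-word term would need URL-encoding first. A minimal sketch using urllib.quote (a hypothetical tweak, not part of the original code):

from urllib import quote

# Percent-encode the term before it is appended to the query string,
# so searches like 'New York' do not break the request URL.
hits = check_dbpedia(quote('New York'))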
def wiki_url(url):
    """Resolve a DBpedia resource URI to its Wikipedia page URL."""
    term = url[url.rfind('/') + 1:]  # resource name after the last slash
    entity_page = 'http://dbpedia.org/data/{}.json'.format(term)
    #print(entity_page)
    wiki_type = 'http://xmlns.com/foaf/0.1/primaryTopic'
    response = urlopen(entity_page)
    data = json.loads(response.read())
    # The key whose value carries foaf:primaryTopic is the Wikipedia page URL
    for key, value in data.items():
        #print("key", value)
        if wiki_type in value:
            return key
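A usage sketch for wiki_url; the resource URI below is only illustrative, in practice it comes from check_dbpedia:

# Prints the Wikipedia page URL carrying foaf:primaryTopic, or None if the
# entity JSON has no such entry.
print wiki_url('http://dbpedia.org/resource/Hypertext_Transfer_Protocol')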
def get_wiki_url(term):
    """Return Wikipedia URLs for a search term, tagged with the match quality."""
    results = check_dbpedia(term)
    #print results
    wikis = {}
    if type(results) == dict:
        # Single exact match
        wiki = wiki_url(results['url'])
        wikis['urls'] = [wiki]
        wikis['match'] = 'exact'
    elif len(results) == 0:
        # Nothing found
        wikis['match'] = 'none'
    else:
        # Up to three partial matches
        wikis['match'] = 'partial'
        wikis['urls'] = []
        for result in results:
            wiki = wiki_url(result['url'])
            wikis['urls'].append(wiki)
    return wikis

urls = get_wiki_url('HTTP')
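To see what comes back, a quick inspection of the result; the 'match' and 'urls' keys are exactly the ones built by get_wiki_url above ('urls' is absent when nothing was found):

print urls['match']
for u in urls.get('urls', []):
    print u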
A second snippet pulls country Infobox fields from the articles in a Wikipedia category, using wikitools to fetch the wikitext and mwparserfromhell to parse it.

import pandas as pd
import mwparserfromhell
from wikitools import wiki
from wikitools import api
from wikitools import category
wikisite = "http://en.wikipedia.org/w/api.php"
parse_category = "United States"
wikiObject = wiki.Wiki(wikisite)
wikiCategory = category.Category(wikiObject, parse_category)
articles = wikiCategory.getAllMembersGen(namespaces=[0])

# This is not an efficient solution, but it is clean...
# It only works with information Wikipedia has already organized into templates.
for article in articles:
    wikiraw = article.getWikiText()
    wikiraw = wikiraw.decode('UTF-8')
    parsedWikiText = mwparserfromhell.parse(wikiraw)
    # Look for the country Infobox template and print selected parameters
    for x in parsedWikiText.nodes:
        if "template" in str(type(x)):
            if "Infobox" in str(x.name):
                print x.get('conventional_long_name')
                print x.get('area_km2')
                print x.get('GDP_nominal_per_capita')
                print x.get('HDI')
                print x.get('Gini')
                print x.get('population_density_km2')
                print x.get('latd')
                print x.get('latm')
                print x.get('latNS')
                print x.get('longd')
                print x.get('longm')
                print x.get('longEW')
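pandas is imported at the top but never used; here is one hedged sketch of how the same fields could be collected into a DataFrame instead of printed. The field list and the infobox_rows helper are assumptions, not part of the original gist:

fields = ['conventional_long_name', 'area_km2', 'GDP_nominal_per_capita',
          'HDI', 'Gini', 'population_density_km2']

def infobox_rows(pages):
    # Yield one dict of infobox parameter values per article
    for page in pages:
        parsed = mwparserfromhell.parse(page.getWikiText().decode('UTF-8'))
        for template in parsed.filter_templates():
            if 'Infobox' in str(template.name):
                yield dict((f, str(template.get(f).value).strip())
                           for f in fields if template.has(f))

df = pd.DataFrame(list(infobox_rows(wikiCategory.getAllMembersGen(namespaces=[0]))))
print df.head()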
A variant from the gist comments: locate the Infobox with find() and list the matching templates with filter_templates().

wikisite = "http://en.wikipedia.org/w/api.php"
parse_category = "USA"
wikiObject = wiki.Wiki(wikisite)
wikiCategory = category.Category(wikiObject, parse_category)
articles = wikiCategory.getAllMembersGen(namespaces=[0])
for article in articles:
    wikiraw = article.getWikiText()
    wikiraw = wikiraw.decode('UTF-8')
    parsedWikiText = mwparserfromhell.parse(wikiraw)
    # find() returns -1 when the page has no Infobox
    indexOfIb = parsedWikiText.find('Infobox')
    if indexOfIb >= 0:
        print indexOfIb
        #for x in parsedWikiText.nodes:
        #    print x
        print parsedWikiText.filter_templates(matches='Infobox')
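A slightly more direct variant under the same assumptions, using filter_templates with the matches keyword and has()/get() to read a parameter only when it exists; the parameter name is the one used in the gist above:

for article in wikiCategory.getAllMembersGen(namespaces=[0]):
    parsed = mwparserfromhell.parse(article.getWikiText().decode('UTF-8'))
    for infobox in parsed.filter_templates(matches='Infobox'):
        # get() raises if the parameter is missing, so check with has() first
        if infobox.has('conventional_long_name'):
            print infobox.get('conventional_long_name').value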