stevenpollack · April 25, 2016 14:13
diff --git a/async_crawl.py b/async_crawl.py
 def crawl(self, current_page):
    """Update attributes of ``self`` from the HTML in ``current_page``.

    The implementation is elided in this snippet. The function mutates
    ``self`` and returns nothing.
    """

 @coroutine
 def coro(current_page):
    """Resolve to the body of the page after ``current_page``, or ``None``.

    Looks up the next page's URL with ``next_page_link``. When there is no
    next page the coroutine finishes with ``None``; otherwise it waits for
    ``async_fetch`` and finishes with the fetched response's ``body``.

    NOTE(review): assumes ``coroutine`` is a generator-based decorator in
    the style of ``tornado.gen.coroutine`` and that ``async_fetch`` returns
    a future resolving to a response object with a ``body`` attribute --
    confirm against the real imports.
    """
    next_page_url = next_page_link(current_page)
    if next_page_url is None:
        # Finish here: ``yield None`` would only suspend the generator and
        # then fall through to fetching a ``None`` URL.
        return
    # ``body`` belongs to the fetched response, not to the pending future,
    # so wait for the fetch to complete before reading it.
    response = yield async_fetch(next_page_url)
    # A generator coroutine's result is its return value, not what it
    # yields (``return <value>`` in a generator needs Python 3.3+).
    return response.body

 @coroutine
 def _crawl_pages(self, first_page):
    """Parse ``first_page`` and every page that follows it.

    For each page the fetch of the following page is started via ``coro``
    before the current page is handed to ``parse``; the loop then waits
    for that fetch and continues with its result. ``coro`` is expected to
    resolve to the next page's body, or ``None`` when there is no next
    page, which ends the loop.

    NOTE(review): assumes ``coroutine`` is a generator-based decorator in
    the style of ``tornado.gen.coroutine`` (futures are awaited with a
    plain ``yield``) -- confirm against the real imports.
    """
    next_page = first_page
    while next_page:
        current_page = next_page
        # Start fetching the following page before parsing this one.
        next_page_future = coro(current_page)
        parse(self, current_page)
        # A lambda cannot contain an assignment, and a done-callback could
        # not rebind this local anyway. Yielding the future suspends the
        # loop until the fetch finishes and feeds its result back in.
        next_page = yield next_page_future

 # NOTE(review): ``self`` must already be bound here; this snippet looks
 # like an excerpt from a method body -- confirm. The returned future
 # should be yielded or handed to the event loop so errors are not lost.
 first_page = fetch_url("http://google.com/movies?near=Berlin")
 crawl_future = _crawl_pages(self, first_page)
	def crawl(self, current_page):
	    """Update attributes of ``self`` from the HTML in ``current_page``.

	    The implementation is elided in this snippet. The function mutates
	    ``self`` and returns nothing.
	    """

	@coroutine
	def coro(current_page):
	    """Resolve to the body of the page after ``current_page``, or ``None``.

	    Looks up the next page's URL with ``next_page_link``. When there is no
	    next page the coroutine finishes with ``None``; otherwise it waits for
	    ``async_fetch`` and finishes with the fetched response's ``body``.

	    NOTE(review): assumes ``coroutine`` is a generator-based decorator in
	    the style of ``tornado.gen.coroutine`` and that ``async_fetch`` returns
	    a future resolving to a response object with a ``body`` attribute --
	    confirm against the real imports.
	    """
	    next_page_url = next_page_link(current_page)
	    if next_page_url is None:
	        # Finish here: ``yield None`` would only suspend the generator and
	        # then fall through to fetching a ``None`` URL.
	        return
	    # ``body`` belongs to the fetched response, not to the pending future,
	    # so wait for the fetch to complete before reading it.
	    response = yield async_fetch(next_page_url)
	    # A generator coroutine's result is its return value, not what it
	    # yields (``return <value>`` in a generator needs Python 3.3+).
	    return response.body

	@coroutine
	def _crawl_pages(self, first_page):
	    """Parse ``first_page`` and every page that follows it.

	    For each page the fetch of the following page is started via ``coro``
	    before the current page is handed to ``parse``; the loop then waits
	    for that fetch and continues with its result. ``coro`` is expected to
	    resolve to the next page's body, or ``None`` when there is no next
	    page, which ends the loop.

	    NOTE(review): assumes ``coroutine`` is a generator-based decorator in
	    the style of ``tornado.gen.coroutine`` (futures are awaited with a
	    plain ``yield``) -- confirm against the real imports.
	    """
	    next_page = first_page
	    while next_page:
	        current_page = next_page
	        # Start fetching the following page before parsing this one.
	        next_page_future = coro(current_page)
	        parse(self, current_page)
	        # A lambda cannot contain an assignment, and a done-callback could
	        # not rebind this local anyway. Yielding the future suspends the
	        # loop until the fetch finishes and feeds its result back in.
	        next_page = yield next_page_future

	# NOTE(review): ``self`` must already be bound here; this snippet looks
	# like an excerpt from a method body -- confirm. The returned future
	# should be yielded or handed to the event loop so errors are not lost.
	first_page = fetch_url("http://google.com/movies?near=Berlin")
	crawl_future = _crawl_pages(self, first_page)
No results found