fadur · February 28, 2011 19:37
diff --git a/strip_html.py b/strip_html.py
 import re
 import urllib


 """
    strip html tags from a webpage
    needs a regex to remove js too
 """

 url = ''
 def strip_tags(url):
     """Fetch *url* and return its body with HTML tags removed.

     Only the tag markup itself (``<...>``) is stripped; text located
     between tags -- including the contents of ``<script>`` or ``<style>``
     elements -- is left in the result.

     Args:
         url: Address of the page to download.

     Returns:
         The page content as text, with every tag replaced by ''.
     """
     # Imported locally so the function works on both Python 2 and 3
     # without touching the file-level imports.
     try:
         from urllib.request import urlopen  # Python 3
     except ImportError:
         from urllib import urlopen  # Python 2

     link = urlopen(url)
     try:
         data = link.read()
         headers = link.info()
     finally:
         # Always release the connection / file handle.
         link.close()

     # On Python 3 read() returns bytes; decode before applying the
     # text pattern. On Python 2 the data is already a str and is used
     # unchanged.
     if not isinstance(data, str):
         charset = headers.get_content_charset() or 'utf-8'
         try:
             data = data.decode(charset, 'replace')
         except LookupError:
             # Server declared an encoding name Python does not know.
             data = data.decode('utf-8', 'replace')

     return re.sub(r'<[^<]*?/?>', '', data)
        
        
 # Script entry: print the tag-stripped page for the module-level ``url``.
 # Written as a call so it parses on Python 3 and prints the same on Python 2.
 print(strip_tags(url))
	import re
	import urllib


	"""
	strip html tags from a webpage
	needs a regex to remove js too
	"""

	url = ''
	def strip_tags(url):
		"""Fetch *url* and return its body with HTML tags removed.

		Only the tag markup itself (``<...>``) is stripped; text located
		between tags -- including the contents of ``<script>`` or ``<style>``
		elements -- is left in the result.

		Args:
			url: Address of the page to download.

		Returns:
			The page content as text, with every tag replaced by ''.
		"""
		# Imported locally so the function works on both Python 2 and 3
		# without touching the file-level imports.
		try:
			from urllib.request import urlopen  # Python 3
		except ImportError:
			from urllib import urlopen  # Python 2

		link = urlopen(url)
		try:
			data = link.read()
			headers = link.info()
		finally:
			# Always release the connection / file handle.
			link.close()

		# On Python 3 read() returns bytes; decode before applying the
		# text pattern. On Python 2 the data is already a str and is used
		# unchanged.
		if not isinstance(data, str):
			charset = headers.get_content_charset() or 'utf-8'
			try:
				data = data.decode(charset, 'replace')
			except LookupError:
				# Server declared an encoding name Python does not know.
				data = data.decode('utf-8', 'replace')

		return re.sub(r'<[^<]*?/?>', '', data)


	# Script entry: print the tag-stripped page for the module-level ``url``.
	# Written as a call so it parses on Python 3 and prints the same on Python 2.
	print(strip_tags(url))
No results found