obswork · December 31, 2018 18:10
diff --git a/gistfile1.txt b/gistfile1.txt
 """Steps:
 (1) You'll first need to open up the developer console in e.g. Chrome (cmd-shift-c)
 (2) Locate the div element with id "main" (should be relatively easy to find as it's the main enclosing div in the body)
 (3) Copy all the inner html of that div (easy way- right-click and select "Edit as HTML", then copy normally)
 (4) Save that to a file somewhere (e.g. /tmp/tracklist.html)
 (5) Open up a python shell (preferably iPython!) and paste the function below into it
 (6) Call the function passing in the path to the file from step 4
 (7) profit
 """

 def extract_tracks(file):
    """Returns tracks from a Spotify playlist
    
    :param file: Path to an html file with a single-enclosing DOM element
    :type file: string
    """
    import lxml.html

    # read in the file from wherever it is saved
    with open('/tmp/tracklist.html', 'r') as f:
       html = f.read()   

    # convert the html blob into an lxml tree
    tree = lxml.html.fragment_fromstring(html)

    # grab all the songs
    songs = tree.xpath("//div[contains(concat(' ', normalize-space(@class), ' '),' tracklist-name ')]")

    # grab all the artist/album info
    metadata = tree.xpath("//div[contains(concat(' ', normalize-space(@class), ' '),' second-line ')]")

    extracted_songs = []
    
    # zip the songs and metadata together, clean up the results a little, and spit them out
    for s, m in zip(songs, metadata):
        meta = m.text_content()[8:] if "Explicit" in m.text_content() else m.text_content()
        meta = meta.replace('•', '/')
        extracted_songs.append("%s - %s" % (s.text, meta))
    return extracted_songs
	"""Steps:
	(1) You'll first need to open up the developer console in e.g. Chrome (cmd-shift-c)
	(2) Locate the div element with id "main" (should be relatively easy to find as it's the main enclosing div in the body)
	(3) Copy all the inner html of that div (easy way- right-click and select "Edit as HTML", then copy normally)
	(4) Save that to a file somewhere (e.g. /tmp/tracklist.html)
	(5) Open up a python shell (preferably iPython!) and paste the function below into it
	(6) Call the function passing in the path to the file from step 4
	(7) profit
	"""

	def extract_tracks(file):
	"""Returns tracks from a Spotify playlist

	:param file: Path to an html file with a single-enclosing DOM element
	:type file: string
	"""
	import lxml.html

	# read in the file from wherever it is saved
	with open('/tmp/tracklist.html', 'r') as f:
	html = f.read()

	# convert the html blob into an lxml tree
	tree = lxml.html.fragment_fromstring(html)

	# grab all the songs
	songs = tree.xpath("//div[contains(concat(' ', normalize-space(@class), ' '),' tracklist-name ')]")

	# grab all the artist/album info
	metadata = tree.xpath("//div[contains(concat(' ', normalize-space(@class), ' '),' second-line ')]")

	extracted_songs = []

	# zip the songs and metadata together, clean up the results a little, and spit them out
	for s, m in zip(songs, metadata):
	meta = m.text_content()[8:] if "Explicit" in m.text_content() else m.text_content()
	meta = meta.replace('•', '/')
	extracted_songs.append("%s - %s" % (s.text, meta))
	return extracted_songs