dpoulopoulos · February 26, 2020 09:42
diff --git a/nmf_1.py b/nmf_1.py
 import pandas as pd

 # Read the Wikipedia Movie Plots dataset from disk.
 df = pd.read_csv('wiki_plots.csv')
 # Read the English first-names list into a single 'names' column;
 # header=0 makes pandas treat the file's first line as a header row,
 # which the explicit names= label then replaces.
 names_df = pd.read_csv('first_names.all.txt', header=0, names=['names'])
 # Keep just the title and plot text, then draw a random half of the movies
 # (no random_state is passed, so the draw is not pinned by this code).
 df = df[['Title', 'Plot']].sample(frac=0.5)
 # Preview the first few rows (rendered only in a notebook/REPL session).
 df.head()
	import pandas as pd

	# Read the Wikipedia Movie Plots dataset from disk.
	df = pd.read_csv('wiki_plots.csv')
	# Read the English first-names list into a single 'names' column;
	# header=0 makes pandas treat the file's first line as a header row,
	# which the explicit names= label then replaces.
	names_df = pd.read_csv('first_names.all.txt', header=0, names=['names'])
	# Keep just the title and plot text, then draw a random half of the movies
	# (no random_state is passed, so the draw is not pinned by this code).
	df = df[['Title', 'Plot']].sample(frac=0.5)
	# Preview the first few rows (rendered only in a notebook/REPL session).
	df.head()
No results found