pedrohbtp · December 11, 2018 13:40
diff --git a/pytorch_dataset_example.py b/pytorch_dataset_example.py
 import torch
 import pandas as pd
 from torch.utils.data import Dataset, DataLoader

 class ExampleDataset(Dataset):
    """Example Dataset"""

    def __init__(self, csv_file):
        """ 
        csv_file (string): Path to the csv file containing data.
        """
        self.data_frame = pd.read_csv(csv_file)

    def __len__(self):
        return len(self.data_frame)

    def __getitem__(self, idx):
        return self.data_frame[idx]

 # instantiates the dataset  
 example_dataset = ExampleDataset('my_data_file.csv')

 # batch size: number of samples returned per iteration
 # shuffle: Flag to shuffle the data before reading so you don't read always in the same order
 # num_workers: used to load the data in parallel
 example_data_loader = DataLoader(example_dataset, , batch_size=4, shuffle=True, num_workers=4)

 # Loops over the data 4 samples at a time
 for batch_index, batch in enumerate(example_data_loader):
    print(batch_index, batch)
	import torch
	import pandas as pd
	from torch.utils.data import Dataset, DataLoader

	class ExampleDataset(Dataset):
	"""Example Dataset"""

	def __init__(self, csv_file):
	"""
	csv_file (string): Path to the csv file containing data.
	"""
	self.data_frame = pd.read_csv(csv_file)

	def __len__(self):
	return len(self.data_frame)

	def __getitem__(self, idx):
	return self.data_frame[idx]

	# instantiates the dataset
	example_dataset = ExampleDataset('my_data_file.csv')

	# batch size: number of samples returned per iteration
	# shuffle: Flag to shuffle the data before reading so you don't read always in the same order
	# num_workers: used to load the data in parallel
	example_data_loader = DataLoader(example_dataset, , batch_size=4, shuffle=True, num_workers=4)

	# Loops over the data 4 samples at a time
	for batch_index, batch in enumerate(example_data_loader):
	print(batch_index, batch)