class MyModule(LightningModule):
    def __init__(self):
        super().__init__()
        self.encoder = RNN(...)
        self.decoder = RNN(...)

    def forward(self, x):
        # models won't be moved after the first forward because
        # they are already on the correct GPUs
        self.encoder.cuda(0)
        self.decoder.cuda(1)

        out = self.encoder(x.cuda(0))
        out = self.decoder(out.cuda(1))  # hand the activations over to gpu 1
        return out
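
# for comparison, the same submodule-per-gpu pattern in plain pytorch --
# a minimal sketch assuming two visible gpus; the layer sizes and the
# TwoGPUNet name are made up for illustration
import torch
from torch import nn

class TwoGPUNet(nn.Module):
    def __init__(self):
        super().__init__()
        self.encoder = nn.LSTM(10, 20, batch_first=True).cuda(0)
        self.decoder = nn.LSTM(20, 10, batch_first=True).cuda(1)

    def forward(self, x):
        out, _ = self.encoder(x.cuda(0))    # runs on gpu 0
        out, _ = self.decoder(out.cuda(1))  # activations moved to gpu 1
        return out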
# change these lines
self.encoder = RNN(...)
self.decoder = RNN(...)

# to these
# now each RNN runs on a different gpu set
self.encoder = DataParallel(self.encoder, device_ids=[0, 1, 2, 3])
self.decoder = DataParallel(self.decoder, device_ids=[4, 5, 6, 7])

# in forward...
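
# standalone sketch of what DataParallel does (assumes a toy linear model
# and at least two gpus): the batch is split along dim 0 across device_ids
# and the outputs are gathered back on device_ids[0]
import torch
from torch import nn

model = nn.DataParallel(nn.Linear(10, 5), device_ids=[0, 1]).cuda(0)
x = torch.randn(32, 10).cuda(0)  # batch of 32 -> 16 examples per gpu
out = model(x)                   # output gathered on gpu 0
print(out.shape)                 # torch.Size([32, 5])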
def tng_dataloader(self):
    d = MNIST()
    # 4: add distributed sampler
    # sampler sends a portion of tng data to each machine
    dist_sampler = DistributedSampler(d)
    dataloader = DataLoader(d, shuffle=False, sampler=dist_sampler)
    return dataloader
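
# what the sampler does in isolation -- a sketch with num_replicas/rank
# passed explicitly (normally they are read from the process group):
import torch
from torch.utils.data import DataLoader, TensorDataset
from torch.utils.data.distributed import DistributedSampler

dataset = TensorDataset(torch.arange(100).float())
sampler = DistributedSampler(dataset, num_replicas=4, rank=0, shuffle=False)
loader = DataLoader(dataset, batch_size=5, sampler=sampler)
print(len(sampler))  # 25 -> each of the 4 replicas sees a quarter of the data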
def main_process_entrypoint(gpu_nb):
    # 2: set up connections between all gpus across all machines
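    # the body was truncated when this gist was captured; a minimal sketch of
    # the usual connection setup with torch.distributed follows (nccl backend;
    # nb_gpus_per_node, nb_nodes and node_rank are assumed to be known here)
    import torch
    import torch.distributed as dist

    world_size = nb_gpus_per_node * nb_nodes
    rank = node_rank * nb_gpus_per_node + gpu_nb  # global rank of this process
    dist.init_process_group('nccl', rank=rank, world_size=world_size)
    torch.cuda.set_device(gpu_nb)
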
# train on 1024 gpus across 128 nodes
trainer = Trainer(nb_gpu_nodes=128, gpus=[0, 1, 2, 3, 4, 5, 6, 7])

# train on 4 gpus on the same machine (much faster than DataParallel)
trainer = Trainer(distributed_backend='ddp', gpus=[0, 1, 2, 3])
import os
import torch
from torch.nn import functional as F
from torch.utils.data import DataLoader
from torchvision.datasets import MNIST
import torchvision.transforms as transforms
import pytorch_lightning as ptl
class CoolModel(ptl.LightningModule):
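    # the class body was cut off when this gist was captured; below is a
    # minimal sketch (layer size, lr and batch size are assumptions; the hook
    # names follow the old lightning API used elsewhere in these snippets)
    def __init__(self):
        super(CoolModel, self).__init__()
        self.l1 = torch.nn.Linear(28 * 28, 10)

    def forward(self, x):
        return torch.relu(self.l1(x.view(x.size(0), -1)))

    def training_step(self, batch, batch_nb):
        x, y = batch
        y_hat = self.forward(x)
        return {'loss': F.cross_entropy(y_hat, y)}

    def configure_optimizers(self):
        return torch.optim.Adam(self.parameters(), lr=0.02)

    def tng_dataloader(self):
        return DataLoader(MNIST(os.getcwd(), train=True, download=True,
                                transform=transforms.ToTensor()),
                          batch_size=32)
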
from pytorch_lightning import Trainer
from test_tube import Experiment

model = CoolModel()
exp = Experiment(save_dir=os.getcwd())

# train on cpu using only 10% of the data and limit to 1 epoch (for demo purposes)
trainer = Trainer(experiment=exp, max_nb_epochs=1, train_percent_check=0.1)
trainer.fit(model)
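
# train on a single gpu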
trainer = Trainer(experiment=exp, max_nb_epochs=1, gpus=[0])
trainer.fit(model)
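
# train on 4 gpus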
trainer = Trainer(experiment=exp, max_nb_epochs=1, gpus=[0, 1, 2, 3])
trainer.fit(model)
from pytorch_lightning import Trainer
from test_tube import Experiment

# RUN THIS SCRIPT ON A MACHINE WHERE THE GPU IDs LISTED BELOW ARE AVAILABLE
def main():
    model = CoolModel()
    exp = Experiment(save_dir=os.getcwd())
    trainer = Trainer(experiment=exp, max_nb_epochs=1, gpus=[0, 1, 2, 3])
    trainer.fit(model)


if __name__ == '__main__':
    main()