slopp · December 23, 2024 20:17
diff --git a/ReadMe.md b/ReadMe.md
diff --git a/r_get_started_to_py.py b/r_get_started_to_py.py
 import modal as md
 import time
 import pathlib
 import requests
 import zipfile
 from PIL import Image
 import os
 from torch.utils.data import Dataset, DataLoader
 from torchvision import transforms
 import pandas as pd
 import torch.nn as nn
 import torch.optim as optim
 from torch import relu, Tensor, tensor, mean, cuda
 import torch

 # Modal plumbing: the app, its container image, and the shared data volume.
 app = md.App("torch-get-started-py")

 # Debian-slim base on Python 3.10, plus the packages installed with pip.
 _slim_base = md.Image.debian_slim(python_version="3.10")
 my_image = _slim_base.pip_install(
    "requests",
    "torch==2.5.1",
    "torchvision==0.20.1",
    "pandas",
 )

 # Named volume, created on first use. To browse it from a local shell:
 #   modal volume ls my-volume extracted/training
 volume = md.Volume.from_name("my-volume", create_if_missing=True)
 # Directory the functions below read and write; they mount the volume at "/root/data".
 p = pathlib.Path("/root/data/")


 # functions to download and unzip from Posit's CDN copy of the kaggle dataset
 @app.function(volumes={"/root/data": volume}, image=my_image)
 def get_dataset():
    """Download the raw zip to the volume.

    Streams the archive from the CDN URL below into ``data.zip`` under ``p``
    in 8 KiB chunks, then commits the volume.

    Any ``requests`` failure (connection error, timeout, non-2xx status) is
    printed rather than raised, so callers must not assume the file exists
    afterwards.
    """
    dataset = "https://torch-cdn.mlverse.org/datasets/guess-the-correlation.zip"
    target = p / "data.zip"
    try:
        # The context manager releases the streamed connection even when the
        # copy fails part-way. The (connect, read) timeout keeps a stalled
        # server from hanging the container indefinitely.
        with requests.get(dataset, stream=True, timeout=(10, 60)) as response:
            response.raise_for_status()
            with open(target, "wb") as file:
                for chunk in response.iter_content(chunk_size=8192):
                    file.write(chunk)

        print("ZIP file downloaded successfully and saved to data.zip")
        volume.commit()
    except requests.exceptions.RequestException as e:
        print(f"An error occurred: {e}")


 @app.function(volumes={"/root/data": volume}, image=my_image)
 def unzip():
    """Extract ``data.zip`` into the ``extracted`` directory under ``p``.

    Per the original author's note, the archive holds the metadata files plus
    a nested zip of images. The volume is committed once extraction finishes.
    """
    archive_path = p / "data.zip"
    destination = p / "extracted"
    with zipfile.ZipFile(archive_path) as archive:
        archive.extractall(destination)
    volume.commit()


 @app.function(volumes={"/root/data": volume}, image=my_image)
 def unzip_train():
    """Extract ``extracted/train_imgs.zip`` into ``extracted/training``.

    Both paths are relative to ``p``. The volume is committed afterwards.
    """
    images_zip = p / "extracted" / "train_imgs.zip"
    images_dir = p / "extracted/training"
    with zipfile.ZipFile(images_zip) as archive:
        archive.extractall(images_dir)
    volume.commit()


 class GuessCorrelationDataset(Dataset):
    """Images from the dataset extract paired with their "corr" labels.

    Image files are read from ``<p>/training/train_imgs`` and labels from
    ``<p>/train.csv``. Items are dicts; see ``__getitem__``.
    """

    def __init__(self, p: pathlib.Path, max_items: int = 64 * 30):
        """
        p: the directory to the dataset extract, eg /root/data/extracted
        max_items: cap on the reported length; defaults to 30 batches of 64
        """
        self.p = p
        self.img_path = self.p / "training/train_imgs"
        # os.listdir returns entries in arbitrary order; sorting keeps the
        # index -> file mapping stable from run to run.
        self.files = sorted(os.listdir(self.img_path))
        self.train_metadata = pd.read_csv(self.p / "train.csv")
        self.max_items = max_items
        self._corr_by_id = self._index_labels(self.train_metadata)
        # Built once here rather than on every __getitem__ call.
        self._to_tensor = transforms.ToTensor()
        self._to_grayscale = transforms.Grayscale(num_output_channels=1)

    @staticmethod
    def _index_labels(metadata) -> dict:
        """Map str(id) -> corr when the metadata has an "id" column, else {}."""
        if "id" not in metadata.columns:
            return {}
        return {
            str(image_id): float(corr)
            for image_id, corr in zip(metadata["id"], metadata["corr"])
        }

    def _label_for(self, idx: int, file_name: str) -> float:
        """Return the correlation label for one image file.

        The label is looked up by the file's stem so that it belongs to the
        image actually loaded. Row position in the CSV says nothing about the
        order of the directory listing.
        NOTE(review): assumes files are named "<id>.<ext>" with ids matching
        the CSV "id" column - confirm against train.csv.
        """
        stem = pathlib.Path(file_name).stem
        if stem in self._corr_by_id:
            return float(self._corr_by_id[stem])
        # No id match: fall back to the previous positional lookup.
        return float(self.train_metadata.iloc[idx]["corr"])

    def __len__(self):
        # Never report more items than there are files to index.
        return min(self.max_items, len(self.files))

    def __getitem__(self, idx):
        """
        Load an individual image as a tensor, plus the correlation label into a dict
            idx: numeric id, eg get the 1st value from the list of image paths
        Returns a dict with:
            x: the tensor representation of the grayscale image
            id: the file name of the image
            corr: the true correlation depicted in the image as a tensor
        """
        file_name = self.files[idx]
        # convert() reads the pixel data, so the file can be closed right after.
        with Image.open(self.img_path / file_name) as img:
            rgb_img = self._to_tensor(img.convert("RGB"))
        img_grayscale = self._to_grayscale(rgb_img)
        corr = tensor(self._label_for(idx, file_name))
        return {"x": img_grayscale, "id": file_name, "corr": corr}


 class myCNN(nn.Module):
    """Minimal CNN: one 3x3 convolution, ReLU, then one fully connected layer.

    Expects grayscale input of shape [batch, 1, 150, 150] (the linear layer's
    input size is fixed for that image size) and returns
    [batch, out_features].
    """

    def __init__(self, out_features: int = 64):
        """
        out_features: number of values the final layer produces per image.
            NOTE(review): a single-value regression would normally use 1; the
            default stays at 64 so existing callers see the same output shape.
        """
        super().__init__()
        # 1 convolutional layer, input channels = 1 (grayscale), output channels = 32, kernel size = 3
        self.conv1 = nn.Conv2d(in_channels=1, out_channels=32, kernel_size=3)

        # An unpadded 3x3 convolution trims one pixel from each border, so a
        # 150 x 150 input leaves conv1 as 32 maps of 148 x 148. The second
        # argument is the output width per image, not the batch size.
        self.fc = nn.Linear(32 * 148 * 148, out_features)

    def forward(self, x):
        x = relu(self.conv1(x))  # convolution followed by ReLU
        # Flatten everything except the batch axis, so any batch size works.
        x = x.flatten(start_dim=1)
        return self.fc(x)  # fully connected layer


 @app.function(
    volumes={"/root/data": volume}, image=my_image, gpu="L40S"
 )  # comment out the gpu bit here to remove the gpu
 def train_my_cnn():
    """Run one training pass of myCNN and print the MSE before and after.

    Builds the dataset from /root/data/extracted, scores the first batch with
    the untrained model, makes a single pass over the DataLoader with Adam
    (lr=0.001) and MSE loss, then scores that same first batch again.
    Results are reported with print(); nothing is returned or saved.
    """
    device = torch.device("cuda" if cuda.is_available() else "cpu")
    print(f"Using device: {device}")
    dataset = GuessCorrelationDataset(p=pathlib.Path("/root/data/extracted"))
    dataloader = DataLoader(dataset=dataset, batch_size=64)
    model = myCNN().to(device=device)

    def per_sample(targets: Tensor, outputs: Tensor) -> Tensor:
        """Expand [batch] labels to the [batch, n] shape of the model output.

        Without this, broadcasting [batch, n] against [batch] lines the labels
        up with the output columns instead of with the samples (rows).
        """
        return targets.unsqueeze(1).expand_as(outputs)

    # Reference batch: scored before and after training
    first_batch = next(iter(dataloader))
    first_tensors: Tensor = first_batch["x"].to(device)
    true_corrs: Tensor = first_batch["corr"].to(device)

    with torch.no_grad():  # evaluation only, no autograd graph needed
        model_output_no_training = model(first_tensors)
        mse_before = mean(
            (model_output_no_training - per_sample(true_corrs, model_output_no_training)) ** 2
        )

    print(f"Test model output with no training: {model_output_no_training}")
    print(f"True values: {true_corrs}")
    print(f"MSE with no training: {mse_before}")

    # Begin Training
    criterion = nn.MSELoss()  # use mse since this is basically a regression problem
    optimizer = optim.Adam(model.parameters(), lr=0.001)
    model.train()  # Set the model to training mode

    for b, batch in enumerate(dataloader, start=1):
        print(f"BATCH: {b}")
        inputs = batch["x"].to(device)
        true_values = batch["corr"].to(device)

        # Zero the gradients
        optimizer.zero_grad()

        # Forward pass
        outputs = model(inputs)

        # Calculate the loss against per-sample targets
        loss = criterion(outputs, per_sample(true_values, outputs))

        # Backward pass and optimize
        loss.backward()
        optimizer.step()

        # Print the statistics after each batch
        print(f"Current loss is: {loss.item()}")

    print(f"MSE at start: {mse_before}")

    with torch.no_grad():
        model_output_with_training = model(first_tensors)
        mse_after = mean(
            (model_output_with_training - per_sample(true_corrs, model_output_with_training)) ** 2
        )

    print(f"MSE at end: {mse_after}")


 @app.local_entrypoint()
 def main():
    """Local entrypoint: run the remote training job and print how long it took."""
    print("Getting started")
    # perf_counter is monotonic, so the elapsed time cannot be skewed by
    # system clock adjustments the way a time.time() difference can.
    start_time = time.perf_counter()
    # Data preparation steps; presumably run once to populate the volume and
    # then left disabled. Uncomment to download and extract the dataset.
    # get_dataset.remote()
    # unzip.remote()
    # unzip_train.remote()
    train_my_cnn.remote()
    elapsed = time.perf_counter() - start_time
    print(f"Took {elapsed} seconds")
	import modal as md
	import time
	import pathlib
	import requests
	import zipfile
	from PIL import Image
	import os
	from torch.utils.data import Dataset, DataLoader
	from torchvision import transforms
	import pandas as pd
	import torch.nn as nn
	import torch.optim as optim
	from torch import relu, Tensor, tensor, mean, cuda
	import torch

	# Modal plumbing: the app, its container image, and the shared data volume.
	app = md.App("torch-get-started-py")

	# Debian-slim base on Python 3.10, plus the packages installed with pip.
	_slim_base = md.Image.debian_slim(python_version="3.10")
	my_image = _slim_base.pip_install(
	    "requests",
	    "torch==2.5.1",
	    "torchvision==0.20.1",
	    "pandas",
	)

	# Named volume, created on first use. To browse it from a local shell:
	#   modal volume ls my-volume extracted/training
	volume = md.Volume.from_name("my-volume", create_if_missing=True)
	# Directory the functions below read and write; they mount the volume at "/root/data".
	p = pathlib.Path("/root/data/")


	# functions to download and unzip from Posit's CDN copy of the kaggle dataset
	@app.function(volumes={"/root/data": volume}, image=my_image)
	def get_dataset():
	    """Download the raw zip to the volume.

	    Streams the archive from the CDN URL below into ``data.zip`` under ``p``
	    in 8 KiB chunks, then commits the volume.

	    Any ``requests`` failure (connection error, timeout, non-2xx status) is
	    printed rather than raised, so callers must not assume the file exists
	    afterwards.
	    """
	    dataset = "https://torch-cdn.mlverse.org/datasets/guess-the-correlation.zip"
	    target = p / "data.zip"
	    try:
	        # The context manager releases the streamed connection even when the
	        # copy fails part-way. The (connect, read) timeout keeps a stalled
	        # server from hanging the container indefinitely.
	        with requests.get(dataset, stream=True, timeout=(10, 60)) as response:
	            response.raise_for_status()
	            with open(target, "wb") as file:
	                for chunk in response.iter_content(chunk_size=8192):
	                    file.write(chunk)

	        print("ZIP file downloaded successfully and saved to data.zip")
	        volume.commit()
	    except requests.exceptions.RequestException as e:
	        print(f"An error occurred: {e}")


	@app.function(volumes={"/root/data": volume}, image=my_image)
	def unzip():
	    """Extract ``data.zip`` into the ``extracted`` directory under ``p``.

	    Per the original author's note, the archive holds the metadata files plus
	    a nested zip of images. The volume is committed once extraction finishes.
	    """
	    archive_path = p / "data.zip"
	    destination = p / "extracted"
	    with zipfile.ZipFile(archive_path) as archive:
	        archive.extractall(destination)
	    volume.commit()


	@app.function(volumes={"/root/data": volume}, image=my_image)
	def unzip_train():
	    """Extract ``extracted/train_imgs.zip`` into ``extracted/training``.

	    Both paths are relative to ``p``. The volume is committed afterwards.
	    """
	    images_zip = p / "extracted" / "train_imgs.zip"
	    images_dir = p / "extracted/training"
	    with zipfile.ZipFile(images_zip) as archive:
	        archive.extractall(images_dir)
	    volume.commit()


	class GuessCorrelationDataset(Dataset):
	    """Images from the dataset extract paired with their "corr" labels.

	    Image files are read from ``<p>/training/train_imgs`` and labels from
	    ``<p>/train.csv``. Items are dicts; see ``__getitem__``.
	    """

	    def __init__(self, p: pathlib.Path, max_items: int = 64 * 30):
	        """
	        p: the directory to the dataset extract, eg /root/data/extracted
	        max_items: cap on the reported length; defaults to 30 batches of 64
	        """
	        self.p = p
	        self.img_path = self.p / "training/train_imgs"
	        # os.listdir returns entries in arbitrary order; sorting keeps the
	        # index -> file mapping stable from run to run.
	        self.files = sorted(os.listdir(self.img_path))
	        self.train_metadata = pd.read_csv(self.p / "train.csv")
	        self.max_items = max_items
	        self._corr_by_id = self._index_labels(self.train_metadata)
	        # Built once here rather than on every __getitem__ call.
	        self._to_tensor = transforms.ToTensor()
	        self._to_grayscale = transforms.Grayscale(num_output_channels=1)

	    @staticmethod
	    def _index_labels(metadata) -> dict:
	        """Map str(id) -> corr when the metadata has an "id" column, else {}."""
	        if "id" not in metadata.columns:
	            return {}
	        return {
	            str(image_id): float(corr)
	            for image_id, corr in zip(metadata["id"], metadata["corr"])
	        }

	    def _label_for(self, idx: int, file_name: str) -> float:
	        """Return the correlation label for one image file.

	        The label is looked up by the file's stem so that it belongs to the
	        image actually loaded. Row position in the CSV says nothing about the
	        order of the directory listing.
	        NOTE(review): assumes files are named "<id>.<ext>" with ids matching
	        the CSV "id" column - confirm against train.csv.
	        """
	        stem = pathlib.Path(file_name).stem
	        if stem in self._corr_by_id:
	            return float(self._corr_by_id[stem])
	        # No id match: fall back to the previous positional lookup.
	        return float(self.train_metadata.iloc[idx]["corr"])

	    def __len__(self):
	        # Never report more items than there are files to index.
	        return min(self.max_items, len(self.files))

	    def __getitem__(self, idx):
	        """
	        Load an individual image as a tensor, plus the correlation label into a dict
	            idx: numeric id, eg get the 1st value from the list of image paths
	        Returns a dict with:
	            x: the tensor representation of the grayscale image
	            id: the file name of the image
	            corr: the true correlation depicted in the image as a tensor
	        """
	        file_name = self.files[idx]
	        # convert() reads the pixel data, so the file can be closed right after.
	        with Image.open(self.img_path / file_name) as img:
	            rgb_img = self._to_tensor(img.convert("RGB"))
	        img_grayscale = self._to_grayscale(rgb_img)
	        corr = tensor(self._label_for(idx, file_name))
	        return {"x": img_grayscale, "id": file_name, "corr": corr}


	class myCNN(nn.Module):
	    """Minimal CNN: one 3x3 convolution, ReLU, then one fully connected layer.

	    Expects grayscale input of shape [batch, 1, 150, 150] (the linear layer's
	    input size is fixed for that image size) and returns
	    [batch, out_features].
	    """

	    def __init__(self, out_features: int = 64):
	        """
	        out_features: number of values the final layer produces per image.
	            NOTE(review): a single-value regression would normally use 1; the
	            default stays at 64 so existing callers see the same output shape.
	        """
	        super().__init__()
	        # 1 convolutional layer, input channels = 1 (grayscale), output channels = 32, kernel size = 3
	        self.conv1 = nn.Conv2d(in_channels=1, out_channels=32, kernel_size=3)

	        # An unpadded 3x3 convolution trims one pixel from each border, so a
	        # 150 x 150 input leaves conv1 as 32 maps of 148 x 148. The second
	        # argument is the output width per image, not the batch size.
	        self.fc = nn.Linear(32 * 148 * 148, out_features)

	    def forward(self, x):
	        x = relu(self.conv1(x))  # convolution followed by ReLU
	        # Flatten everything except the batch axis, so any batch size works.
	        x = x.flatten(start_dim=1)
	        return self.fc(x)  # fully connected layer


	@app.function(
	    volumes={"/root/data": volume}, image=my_image, gpu="L40S"
	)  # comment out the gpu bit here to remove the gpu
	def train_my_cnn():
	    """Run one training pass of myCNN and print the MSE before and after.

	    Builds the dataset from /root/data/extracted, scores the first batch with
	    the untrained model, makes a single pass over the DataLoader with Adam
	    (lr=0.001) and MSE loss, then scores that same first batch again.
	    Results are reported with print(); nothing is returned or saved.
	    """
	    device = torch.device("cuda" if cuda.is_available() else "cpu")
	    print(f"Using device: {device}")
	    dataset = GuessCorrelationDataset(p=pathlib.Path("/root/data/extracted"))
	    dataloader = DataLoader(dataset=dataset, batch_size=64)
	    model = myCNN().to(device=device)

	    def per_sample(targets: Tensor, outputs: Tensor) -> Tensor:
	        """Expand [batch] labels to the [batch, n] shape of the model output.

	        Without this, broadcasting [batch, n] against [batch] lines the labels
	        up with the output columns instead of with the samples (rows).
	        """
	        return targets.unsqueeze(1).expand_as(outputs)

	    # Reference batch: scored before and after training
	    first_batch = next(iter(dataloader))
	    first_tensors: Tensor = first_batch["x"].to(device)
	    true_corrs: Tensor = first_batch["corr"].to(device)

	    with torch.no_grad():  # evaluation only, no autograd graph needed
	        model_output_no_training = model(first_tensors)
	        mse_before = mean(
	            (model_output_no_training - per_sample(true_corrs, model_output_no_training)) ** 2
	        )

	    print(f"Test model output with no training: {model_output_no_training}")
	    print(f"True values: {true_corrs}")
	    print(f"MSE with no training: {mse_before}")

	    # Begin Training
	    criterion = nn.MSELoss()  # use mse since this is basically a regression problem
	    optimizer = optim.Adam(model.parameters(), lr=0.001)
	    model.train()  # Set the model to training mode

	    for b, batch in enumerate(dataloader, start=1):
	        print(f"BATCH: {b}")
	        inputs = batch["x"].to(device)
	        true_values = batch["corr"].to(device)

	        # Zero the gradients
	        optimizer.zero_grad()

	        # Forward pass
	        outputs = model(inputs)

	        # Calculate the loss against per-sample targets
	        loss = criterion(outputs, per_sample(true_values, outputs))

	        # Backward pass and optimize
	        loss.backward()
	        optimizer.step()

	        # Print the statistics after each batch
	        print(f"Current loss is: {loss.item()}")

	    print(f"MSE at start: {mse_before}")

	    with torch.no_grad():
	        model_output_with_training = model(first_tensors)
	        mse_after = mean(
	            (model_output_with_training - per_sample(true_corrs, model_output_with_training)) ** 2
	        )

	    print(f"MSE at end: {mse_after}")


	@app.local_entrypoint()
	def main():
	    """Local entrypoint: run the remote training job and print how long it took."""
	    print("Getting started")
	    # perf_counter is monotonic, so the elapsed time cannot be skewed by
	    # system clock adjustments the way a time.time() difference can.
	    start_time = time.perf_counter()
	    # Data preparation steps; presumably run once to populate the volume and
	    # then left disabled. Uncomment to download and extract the dataset.
	    # get_dataset.remote()
	    # unzip.remote()
	    # unzip_train.remote()
	    train_my_cnn.remote()
	    elapsed = time.perf_counter() - start_time
	    print(f"Took {elapsed} seconds")