def actor_loss_fn(self, logprobs, old_logprobs, advantages, mask):
    ## Clipped PPO policy-gradient loss
    log_ratio = (logprobs - old_logprobs) * mask
    ratio = torch.exp(log_ratio)
    # Unclipped vs. clipped surrogate objectives (negated for minimization)
    pg_loss1 = -advantages * ratio
    pg_loss2 = -advantages * torch.clamp(ratio, 1.0 - self.cliprange,
                                         1.0 + self.cliprange)
    # Pessimistic (element-wise max) loss, averaged over the valid-token mask
    pg_loss = torch.sum(torch.max(pg_loss1, pg_loss2) * mask) / mask.sum()
    return pg_loss
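A quick usage sketch with dummy tensors; the `SimpleNamespace` standing in for `self` and the cliprange value are illustrative assumptions, not part of the original gist:

import torch
from types import SimpleNamespace

cfg = SimpleNamespace(cliprange=0.2)           # hypothetical config carrying cliprange
logprobs     = torch.tensor([[-1.0, -0.5]])    # new policy log-probs
old_logprobs = torch.tensor([[-1.2, -0.4]])    # behavior policy log-probs
advantages   = torch.tensor([[ 0.5, -0.3]])
mask         = torch.ones(1, 2)                # all tokens valid
print(actor_loss_fn(cfg, logprobs, old_logprobs, advantages, mask))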
# Use case
def make_prompt(input_text: str, system_prompt="", max_length=512) -> str:
    """
    Builds the prompt string that is fed to the language model.

    Args:
        input_text (str): The input text for prompting.
        system_prompt (str): The system prompt (not used in the function).
        max_length (int): The maximum length of the generated text.

    Returns:
        str: The formatted prompt.
    """
    # The original gist is truncated here; a minimal assumed body:
    return f"### Instruction:\n{input_text}\n\n### Response:\n"
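Calling it is straightforward; note the template above is an assumption, since the gist cuts off before the body:

print(make_prompt("Summarize the plot of Hamlet in two sentences."))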
import random
import textwrap

import torch  # torch is required for the device check below

device = 'cuda' if torch.cuda.is_available() else 'cpu'

def text_wrapper(text, width=90):
    # Wraps the input text to the specified width
    return textwrap.fill(text, width)
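A one-line usage check (the sample string is illustrative):

print(text_wrapper("The quick brown fox jumps over the lazy dog. " * 5))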
import torch
from datasets import load_dataset
from peft import LoraConfig
from transformers import (
    AutoModelForCausalLM,
    AutoTokenizer,
    BitsAndBytesConfig,
    HfArgumentParser,
    TrainingArguments,
)
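These imports point at a 4-bit (QLoRA-style) fine-tuning setup; below is a minimal sketch of how they are commonly wired together. The model name and every hyperparameter are illustrative assumptions, not values from the original:

bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,                      # quantize weights to 4 bits
    bnb_4bit_quant_type="nf4",              # NormalFloat4 quantization
    bnb_4bit_compute_dtype=torch.bfloat16,  # run matmuls in bf16
)
model = AutoModelForCausalLM.from_pretrained(
    "meta-llama/Llama-2-7b-hf",             # assumed base model
    quantization_config=bnb_config,
    device_map="auto",
)
tokenizer = AutoTokenizer.from_pretrained("meta-llama/Llama-2-7b-hf")
peft_config = LoraConfig(
    r=16, lora_alpha=32, lora_dropout=0.05,
    bias="none", task_type="CAUSAL_LM",
)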
import argparse
import os
from functools import partial

import bitsandbytes as bnb
import torch
from datasets import load_dataset
from peft import LoraConfig, get_peft_model, prepare_model_for_kbit_training, AutoPeftModelForCausalLM
from transformers import (
    AutoModelForCausalLM, AutoTokenizer, set_seed, Trainer, TrainingArguments,
    BitsAndBytesConfig, DataCollatorForLanguageModeling,
)
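A hedged sketch of the k-bit preparation flow these imports imply; the base model and LoRA settings are placeholders for illustration:

set_seed(42)
model = AutoModelForCausalLM.from_pretrained(
    "facebook/opt-350m",  # placeholder model
    quantization_config=BitsAndBytesConfig(load_in_4bit=True),
    device_map="auto",
)
model = prepare_model_for_kbit_training(model)   # cast norms, enable input grads
model = get_peft_model(model, LoraConfig(task_type="CAUSAL_LM"))  # attach LoRA adapters
model.print_trainable_parameters()               # sanity-check the trainable fraction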
from tqdm import tqdm  # used below but never imported in the original

def train_one_epoch(model, optimizer, scheduler, dataloader, device, epoch):
    model.train()
    dataset_size = 0
    running_loss = 0.0
    # total=len(dataloader) tells tqdm how many batches the progress bar covers
    bar = tqdm(enumerate(dataloader), total=len(dataloader))
    for step, data in bar:
        ids = data['input_ids'].to(device, dtype=torch.long)
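        # --- Continuation sketch: the original gist is truncated above. ---
        # Assumes an HF-style causal LM where passing labels returns the loss.
        mask = data['attention_mask'].to(device, dtype=torch.long)
        loss = model(input_ids=ids, attention_mask=mask, labels=ids).loss
        loss.backward()
        optimizer.step()
        scheduler.step()
        optimizer.zero_grad()
        running_loss += loss.item() * ids.size(0)
        dataset_size += ids.size(0)
        bar.set_postfix(epoch=epoch, loss=running_loss / dataset_size)
    return running_loss / dataset_size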
import tensorflow as tf
from tensorflow import keras

class ChildDense(keras.layers.Layer):
    def __init__(self, units, activation=None):
        super().__init__()
        self.units = units
        self.activation = activation
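    # --- Continuation sketch: build/call were cut off in the original; ---
    # --- this follows the standard custom-Dense layer pattern.         ---
    def build(self, input_shape):
        input_dim = input_shape[-1]
        # One kernel matrix and one bias vector, as in keras.layers.Dense
        self.W = self.add_weight(shape=(input_dim, self.units),
                                 initializer="random_normal")
        self.b = self.add_weight(shape=(self.units,), initializer="zeros")

    def call(self, inputs):
        y = tf.matmul(inputs, self.W) + self.b
        if self.activation is not None:
            y = self.activation(y)  # e.g. tf.nn.relu passed to __init__
        return y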
from statsmodels.tsa.stattools import adfuller
from statsmodels.tsa.seasonal import seasonal_decompose
import statsmodels.api as sm
from sklearn.metrics import mean_squared_error, mean_absolute_error
import math

# Test for stationarity
def test_stationarity(timeseries):
    # Determine rolling statistics over a 12-period window
    rolling_mean = timeseries.rolling(12).mean()
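    # --- Continuation sketch: the original gist is truncated above. ---
    rolling_std = timeseries.rolling(12).std()
    # Augmented Dickey-Fuller test: a p-value below ~0.05 rejects the
    # unit-root null, i.e. suggests the series is stationary
    result = adfuller(timeseries.dropna(), autolag='AIC')
    print(f'ADF statistic: {result[0]:.4f}')
    print(f'p-value:       {result[1]:.4f}')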
# Now generate per-class TPR, FPR and ROC-AUC data (one-vs-rest).
# Note: the original `[[]]*number_of_classes` creates n references to one
# shared list; `[None] * n` says what is actually meant here.
tpr, fpr, roc_auc = ([None] * number_of_classes for _ in range(3))
f, ax = plt.subplots()
for i in range(number_of_classes):
    # Treat class i as the positive class, everything else as negative
    fpr[i], tpr[i], _ = roc_curve(labels == i, predictions[:, i])
    roc_auc[i] = auc(fpr[i], tpr[i])
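# --- Continuation sketch: `ax` is otherwise unused, so plotting presumably ---
# --- followed; labels and styling here are illustrative assumptions.       ---
for i in range(number_of_classes):
    ax.plot(fpr[i], tpr[i], label=f'class {i} (AUC = {roc_auc[i]:.2f})')
ax.plot([0, 1], [0, 1], 'k--', label='chance')
ax.set_xlabel('False positive rate')
ax.set_ylabel('True positive rate')
ax.legend()
plt.show()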
import numpy as np
import matplotlib.pyplot as plt
from sklearn.metrics import roc_auc_score, roc_curve, auc

# Generate synthetic data
number_of_classes = 5
samples_per_class = 70
# Continuation sketch (the original cuts off here): random scores, row-normalized
# so they behave like class probabilities, with the true class nudged upward
rng = np.random.default_rng(0)
labels = np.repeat(np.arange(number_of_classes), samples_per_class)
scores = rng.random((number_of_classes * samples_per_class, number_of_classes))
scores[np.arange(labels.size), labels] += 1.0
predictions = scores / scores.sum(axis=1, keepdims=True)