import logging
import random

import ray
from transformers import RagConfig, RagRetriever, RagTokenizer
from transformers import DPRContextEncoderTokenizerFast
from transformers.file_utils import requires_datasets, requires_faiss
from transformers.models.rag.retrieval_rag import CustomHFIndex
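For context, a minimal sketch of how these imports fit together (the checkpoint names and the use_dummy_dataset flag are illustrative assumptions, not taken from the snippet above):

# Hypothetical usage sketch; "facebook/rag-token-base" and use_dummy_dataset
# are assumptions for illustration, not part of the original snippet.
tokenizer = RagTokenizer.from_pretrained("facebook/rag-token-base")
retriever = RagRetriever.from_pretrained(
    "facebook/rag-token-base",
    index_name="exact",
    use_dummy_dataset=True,  # small dummy wiki_dpr index instead of the full one
)
ctx_tokenizer = DPRContextEncoderTokenizerFast.from_pretrained(
    "facebook/dpr-ctx_encoder-single-nq-base"  # tokenizes passages for re-embedding
)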
# `load_from_disk` and `concatenate_datasets` come from the `datasets` library.
if isOtherThreadIndexBusy:
    if not threadHandle_index.is_alive():  # the re-indexing thread has finished
        # Gather the embedded dataset shards written by the worker processes
        # and merge them into a single passages dataset on disk.
        saved_dataset_shards = []
        for address in data_shard_addressses:
            saved_dataset_shards.append(load_from_disk(address))
        concat = concatenate_datasets(saved_dataset_shards)
        concat.save_to_disk(self.config.passages_path)
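To illustrate the save/load round trip these calls rely on, a self-contained sketch (the paths and toy data are hypothetical):

from datasets import Dataset, concatenate_datasets, load_from_disk

# Write two tiny shards to disk, as the embedding workers would.
shard_paths = ["/tmp/shard_0", "/tmp/shard_1"]  # hypothetical locations
for i, path in enumerate(shard_paths):
    Dataset.from_dict({"text": [f"passage {i}"]}).save_to_disk(path)

# Reload and merge them into one dataset, mirroring the loop above.
merged = concatenate_datasets([load_from_disk(p) for p in shard_paths])
merged.save_to_disk("/tmp/passages")
print(len(merged))  # 2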
def training_step(self, batch, batch_idx) -> Dict:
    global stepCount
    global isEmUpdateBusy
    global isAddIndexBusy
    global processes
    global isOtherThreadIndexBusy
    if self.trainer.global_rank == 0:  # initialize the parallel embedding-computation process only on the master DDP rank
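The `isOtherThreadIndexBusy` flag works together with a thread handle whose liveness gets polled, as in the shard-merging snippet above; a minimal sketch of that pattern (the `build_index` worker is hypothetical):

import threading

def build_index():
    ...  # hypothetical worker, e.g. add freshly embedded passages to a FAISS index

# Launch the indexing thread and mark it busy.
threadHandle_index = threading.Thread(target=build_index)
threadHandle_index.start()
isOtherThreadIndexBusy = True

# Later, e.g. inside training_step: once the thread has finished,
# clear the flag and merge the dataset shards.
if isOtherThreadIndexBusy and not threadHandle_index.is_alive():
    isOtherThreadIndexBusy = False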
# See the training_step hook in pytorch-lightning for further details on this function.
def training_step(self, batch, batch_idx) -> Dict:
    global isEmUpdateBusy  # global flag used by the parallel embedding-computation process
    if self.trainer.global_rank == 0:  # initialize the parallel embedding-computation process only on the master DDP rank
        if batch_idx != 0 and batch_idx % 500 == 0:  # we want the embeddings to get updated on every 500th step
            # Any number of free GPUs can be assigned to update the embeddings (optional).
            free_gpu_list = []
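One way to populate `free_gpu_list` is to probe per-device memory with torch; a sketch under the assumption that "free" means nothing is currently allocated by this process (the original script may instead take the GPU ordering from a command-line argument):

import torch

# Assumption: a GPU counts as free if this process has no memory allocated
# on it; swap in whatever criterion the training script actually uses.
free_gpu_list = []
for device_id in range(torch.cuda.device_count()):
    if torch.cuda.memory_allocated(device_id) == 0:
        free_gpu_list.append(device_id)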
""" Trains an agent with (stochastic) Policy Gradients on Pong. Uses OpenAI Gym. """ | |
import numpy as np | |
import cPickle as pickle | |
import gym | |
# hyperparameters | |
H = 200 # number of hidden layer neurons | |
batch_size = 10 # every how many episodes to do a param update? | |
learning_rate = 1e-4 | |
gamma = 0.99 # discount factor for reward |
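gamma feeds the discounted-return computation that appears later in this script; a sketch of that standard step (the reset at nonzero rewards is Pong-specific, because each point scored ends a game):

def discount_rewards(r):
    """ take 1D float array of rewards and compute discounted reward """
    discounted_r = np.zeros_like(r)
    running_add = 0
    for t in reversed(range(r.size)):
        if r[t] != 0:
            running_add = 0  # reset the sum, since this was a game boundary (Pong specific!)
        running_add = running_add * gamma + r[t]
        discounted_r[t] = running_add
    return discounted_r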