Rahul Agarwal (MLWhiz)
import torch
import torch.nn as nn
import torch.nn.functional as F

# 2D-CNN text classifier (PyTorch port of the Keras kernel referenced below)
class CNN_Text(nn.Module):
    def __init__(self):
        super(CNN_Text, self).__init__()
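        # Sketch (assumption) of the truncated body, mirroring the Keras
        # kernel below: one Conv2d per filter size over the embedded sequence,
        # max-pool each feature map, concatenate, then a dense layer. The
        # original gist's exact layers and sizes may differ.
        filter_sizes = [1, 2, 3, 5]
        num_filters = 36
        self.embedding = nn.Embedding(max_features, embed_size)
        self.convs = nn.ModuleList([
            nn.Conv2d(1, num_filters, (k, embed_size)) for k in filter_sizes])
        self.fc = nn.Linear(num_filters * len(filter_sizes), 1)

    def forward(self, x):
        x = self.embedding(x).unsqueeze(1)        # (batch, 1, maxlen, embed_size)
        x = [F.relu(conv(x)).squeeze(3) for conv in self.convs]
        x = [F.max_pool1d(t, t.size(2)).squeeze(2) for t in x]
        return self.fc(torch.cat(x, 1))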
# https://www.kaggle.com/yekenot/2dcnn-textclassifier
from keras.layers import Input, Embedding, Reshape, Conv2D, MaxPool2D, Concatenate, Flatten, Dropout, Dense
from keras.models import Model

def model_cnn(embedding_matrix):
    filter_sizes = [1, 2, 3, 5]
    num_filters = 36
    inp = Input(shape=(maxlen,))
    x = Embedding(max_features, embed_size, weights=[embedding_matrix])(inp)
    x = Reshape((maxlen, embed_size, 1))(x)
    maxpool_pool = []
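    # Sketch (assumption) of how the kernel continues: convolve with each
    # filter size, max-pool over the full feature map, then concatenate and
    # classify. The referenced kernel's exact head may differ.
    for k in filter_sizes:
        conv = Conv2D(num_filters, kernel_size=(k, embed_size), activation='relu')(x)
        maxpool_pool.append(MaxPool2D(pool_size=(maxlen - k + 1, 1))(conv))
    z = Concatenate(axis=1)(maxpool_pool)
    z = Flatten()(z)
    z = Dropout(0.1)(z)
    outp = Dense(1, activation='sigmoid')(z)
    model = Model(inputs=inp, outputs=outp)
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model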
class BiLSTM(nn.Module):
    def __init__(self):
        super(BiLSTM, self).__init__()
        self.hidden_size = 64
        drp = 0.1  # dropout rate used further down in the gist
        # Frozen pretrained embeddings
        self.embedding = nn.Embedding(max_features, embed_size)
        self.embedding.weight = nn.Parameter(torch.tensor(embedding_matrix, dtype=torch.float32))
        self.embedding.weight.requires_grad = False
        self.lstm = nn.LSTM(embed_size, self.hidden_size, bidirectional=True, batch_first=True)
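        # Sketch (assumption) of a typical head and forward pass for this
        # model; the original gist's exact layers may differ.
        self.linear = nn.Linear(self.hidden_size * 2, 64)
        self.dropout = nn.Dropout(drp)
        self.out = nn.Linear(64, 1)

    def forward(self, x):
        h_embedding = self.embedding(x)
        h_lstm, _ = self.lstm(h_embedding)        # (batch, maxlen, 2 * hidden_size)
        max_pool, _ = torch.max(h_lstm, dim=1)    # max-pool over the time axis
        conc = self.dropout(F.relu(self.linear(max_pool)))
        return self.out(conc)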
# Bidirectional LSTM
from keras.layers import Input, Embedding, Bidirectional, CuDNNLSTM

def model_lstm_du(embedding_matrix):
    inp = Input(shape=(maxlen,))
    x = Embedding(max_features, embed_size, weights=[embedding_matrix])(inp)
    '''
    Here 64 is the size (dim) of the hidden state vector as well as of the
    output vector. With return_sequences=True we get the output at every
    timestep, so the output of this layer has shape maxlen(70) x 128
    (64 units x 2 for the bidirectional concatenation). CuDNNLSTM is a fast
    implementation of the LSTM layer in Keras that only runs on a GPU.
    '''
    x = Bidirectional(CuDNNLSTM(64, return_sequences=True))(x)
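    # Sketch (assumption) of how this function likely continues: pool the
    # per-timestep outputs (average + max), then a small dense head.
    # GlobalAveragePooling1D, GlobalMaxPooling1D, concatenate, Dense, Dropout
    # and Model are assumed imported from keras.
    avg_pool = GlobalAveragePooling1D()(x)
    max_pool = GlobalMaxPooling1D()(x)
    conc = concatenate([avg_pool, max_pool])
    conc = Dense(64, activation='relu')(conc)
    conc = Dropout(0.1)(conc)
    outp = Dense(1, activation='sigmoid')(conc)
    model = Model(inputs=inp, outputs=outp)
    model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model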
class Attention(nn.Module):
    def __init__(self, feature_dim, step_dim, bias=True, **kwargs):
        super(Attention, self).__init__(**kwargs)
        self.supports_masking = True
        self.bias = bias
        self.feature_dim = feature_dim
        self.step_dim = step_dim
        self.features_dim = 0  # carried over from the Keras original; unused here
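        # Sketch (assumption) of the truncated remainder: a learned scoring
        # vector plus an optional per-timestep bias, and a forward pass that
        # softmaxes the scores over time and takes the weighted sum.
        weight = torch.zeros(feature_dim, 1)
        nn.init.xavier_uniform_(weight)
        self.weight = nn.Parameter(weight)
        if bias:
            self.b = nn.Parameter(torch.zeros(step_dim))

    def forward(self, x, mask=None):
        # x: (batch, step_dim, feature_dim) -> scores: (batch, step_dim)
        eij = torch.mm(x.contiguous().view(-1, self.feature_dim), self.weight).view(-1, self.step_dim)
        if self.bias:
            eij = eij + self.b
        a = torch.softmax(torch.tanh(eij), dim=1).unsqueeze(-1)
        return torch.sum(x * a, 1)   # (batch, feature_dim)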
from keras import backend as K

def dot_product(x, kernel):
    """
    Wrapper for the dot product operation, to be compatible with both
    the Theano and TensorFlow backends.
    Args:
        x: input tensor
        kernel: weight tensor
    Returns:
        The dot product of x and kernel.
    """
    if K.backend() == 'tensorflow':
        # TensorFlow needs the explicit expand/squeeze for higher-rank dots
        return K.squeeze(K.dot(x, K.expand_dims(kernel)), axis=-1)
    else:
        return K.dot(x, kernel)
from fastai.text import *  # fastai v1 API

# Language model data: we use test_df as the validation set for the language model
data_lm = TextLMDataBunch.from_df(path="", train_df=train_df, valid_df=test_df)
learn = language_model_learner(data_lm, AWD_LSTM, drop_mult=0.5)
# Train the language model with discriminative fine-tuning
learn.fit_one_cycle(1, 1e-2)
learn.unfreeze()
learn.fit_one_cycle(1, 1e-3)
# Save the fine-tuned encoder
learn.save_encoder('ft_enc')
# Create the classification data, reusing the language model's vocabulary
data_clas = TextClasDataBunch.from_df(path="", train_df=train, valid_df=valid, test_df=test_df,
                                      vocab=data_lm.train_ds.vocab, bs=32, label_cols='target')
# Create the classifier learner
learn = text_classifier_learner(data_clas, AWD_LSTM, drop_mult=0.5)
# Load the weights of the fine-tuned language model encoder
learn.load_encoder('ft_enc')
# Fit the classifier
learn.fit_one_cycle(1, 1e-2)
# Fit again after freezing all but the last 2 layer groups
learn.freeze_to(-2)
learn.fit_one_cycle(1, 1e-3)  # this learning rate is an assumption; the gist cuts off here
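# Sketch (assumption): single-example inference with the trained classifier;
# in fastai v1, learn.predict returns (predicted class, class index, probabilities).
pred_class, pred_idx, probs = learn.predict("example question text")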
#!/usr/bin/env python3
import requests
import time
import argparse
import os
import json
from requests.compat import urljoin

# Simple wrapper around the Telegram Bot HTTP API
class BotHandler(object):
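    # Sketch (assumption) of the usual methods for this pattern, built on the
    # public Telegram Bot API endpoints getUpdates and sendMessage; the
    # original gist's exact methods and defaults may differ.
    def __init__(self, token):
        self.token = token
        self.api_url = "https://api.telegram.org/bot{}/".format(token)

    def get_updates(self, offset=None, timeout=30):
        # Long-poll for new updates, optionally resuming from an offset
        params = {"timeout": timeout, "offset": offset}
        resp = requests.get(urljoin(self.api_url, "getUpdates"), params=params)
        return resp.json()["result"]

    def send_message(self, chat_id, text):
        # Send a plain-text reply to the given chat
        params = {"chat_id": chat_id, "text": text}
        return requests.post(urljoin(self.api_url, "sendMessage"), params=params)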