Skip to content

Instantly share code, notes, and snippets.

@ksv-muralidhar
ksv-muralidhar / 1.py
Last active March 30, 2021 08:52
smote
import numpy as np
import pandas as pd
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split, GridSearchCV, StratifiedKFold
from sklearn.preprocessing import MinMaxScaler
from imblearn.over_sampling import SMOTE
from imblearn.pipeline import Pipeline as imbpipeline
from sklearn.pipeline import Pipeline
from sklearn.datasets import make_classification, load_breast_cancer
@ksv-muralidhar
ksv-muralidhar / ct1.py
Last active May 5, 2023 11:01
Custom Transformer
import pandas as pd
import numpy as np
from sklearn.base import BaseEstimator,TransformerMixin
from sklearn.compose import ColumnTransformer
from sklearn.preprocessing import FunctionTransformer
from sklearn.datasets import load_iris
from sklearn.model_selection import GridSearchCV
from sklearn.pipeline import Pipeline
from sklearn.impute import SimpleImputer
from sklearn.linear_model import LogisticRegression
@ksv-muralidhar
ksv-muralidhar / ct1.py
Created February 25, 2021 16:49
Custom Transformers
import pandas as pd
import numpy as np
from sklearn.base import BaseEstimator,TransformerMixin
from sklearn.compose import ColumnTransformer
from sklearn.preprocessing import FunctionTransformer
from sklearn.datasets import load_iris
from sklearn.model_selection import GridSearchCV
from sklearn.pipeline import Pipeline
from sklearn.impute import SimpleImputer
from sklearn.linear_model import LogisticRegression
@ksv-muralidhar
ksv-muralidhar / dl1.py
Last active February 21, 2021 17:14
data leakage
import numpy as np
import pandas as pd
from sklearn.datasets import load_boston
from sklearn.preprocessing import StandardScaler
from sklearn.pipeline import Pipeline
from sklearn.impute import SimpleImputer
from sklearn.neighbors import KNeighborsRegressor
from sklearn.model_selection import cross_validate, train_test_split
from sklearn.metrics import mean_squared_error
@ksv-muralidhar
ksv-muralidhar / k1.py
Last active February 20, 2021 14:02
kaggle survey 2020
import numpy as np
import pandas as pd
from apyori import apriori
from termcolor import colored
data = pd.read_csv("../input/kaggle-survey-2020/kaggle_survey_2020_responses.csv",header=1)
@ksv-muralidhar
ksv-muralidhar / cv_1.py
Last active February 17, 2021 13:22
cross val
import pandas as pd
from sklearn.model_selection import train_test_split,StratifiedKFold,cross_validate
from sklearn.datasets import load_iris
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score
@ksv-muralidhar
ksv-muralidhar / pipe_1.py
Last active February 17, 2021 11:39
Pipeline
from sklearn.compose import ColumnTransformer
@ksv-muralidhar
ksv-muralidhar / hist_1.py
Last active February 16, 2021 12:45
histogram bins
# Show how the number of bins changes the look of a histogram: the same
# normally distributed sample is drawn six times on a 2x3 grid of axes,
# each panel using a different bin count.
# NOTE(review): `plt` and `sns` are not imported in the visible snippet --
# presumably matplotlib.pyplot and seaborn; confirm against the full file.
fig, ax = plt.subplots(2, 3, figsize=(15, 10))
np.random.seed(11)  # fixed seed so every run plots the same sample
norm_dist = np.random.randn(1000)
for n, i in enumerate(np.linspace(5, 100, 6)):
    # Derive the grid cell from the panel index. The previous manual
    # counters reset `col` on each new row but never advanced it, so every
    # histogram in a row landed on column 0. The 3 matches the column
    # count passed to plt.subplots above.
    row, col = divmod(n, 3)
    # linspace yields floats; both the bin count and the title want ints.
    sns.histplot(x=norm_dist, bins=int(i), ax=ax[row, col])
    ax[row, col].set_title(f'bins = {int(i)}')
@ksv-muralidhar
ksv-muralidhar / api_1.py
Created February 16, 2021 07:11
API data extraction
import requests
import pandas as pd
from IPython.display import display
@ksv-muralidhar
ksv-muralidhar / learning_curve_1.py
Created February 16, 2021 05:52
Learning Curve
from sklearn.model_selection import learning_curve