This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import argparse | |
from itertools import chain | |
import evaluate | |
from datasets import load_dataset | |
from transformers import AutoTokenizer, AutoModelForMaskedLM, Trainer, TrainingArguments, DataCollatorForLanguageModeling | |
if __name__ == "__main__": |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import os | |
import json | |
from typing import Optional, Any, Union, Dict | |
import mlflow | |
from transformers import TrainingArguments | |
from accelerate.tracking import GeneralTracker | |
from accelerate.logging import get_logger |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Generic LM | |
roberta-base | |
roberta-large | |
microsoft/deberta-v3-base | |
microsoft/deberta-v3-large | |
microsoft/deberta-v3-xsmall | |
# Long LM | |
allenai/longformer-base-4096 | |
google/bigbird-roberta-base |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
function SUMMARIZE(input, repo_id="google/pegasus-xsum", use_gpu=false) { | |
// other models to consider | |
// short sequences | |
// sshleifer/distilbart-cnn-12-6 | |
// knkarthick/MEETING_SUMMARY | |
// long sequences | |
// google/bigbird-pegasus-large-bigpatent |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import torch | |
from torch import nn | |
class MultiSampleDropout(nn.Module): | |
def __init__(self, dropout_probs, problem_type, num_labels) -> None: | |
super().__init__() | |
self.dropouts = [nn.Dropout(p=p) for p in dropout_probs] | |
self.problem_type = problem_type |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
from typing import Any, Optional, Union, Tuple | |
import torch | |
from torch import nn | |
from transformers.activations import ACT2FN | |
from transformers.models.deberta.modeling_deberta import ( | |
DebertaPreTrainedModel, | |
DebertaModel, | |
) | |
from transformers.models.deberta_v2.modeling_deberta_v2 import ( |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
def reinit_model_weights(model, n_layers, config): | |
# use whatever you named your transformer module | |
backbone = model.backbone | |
encoder_layers = backbone.encoder.layer | |
reinit_layers(encoder_layers, n_layers, std) | |
# use whatever you named the output | |
reinit_modules([model.output], std) |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
from torch import nn | |
from transformers import AutoModel | |
class Model(nn.Module): | |
def __init__(self, config): | |
super().__init__() | |
self.model = AutoModel.from_pretrained(...) | |
self.dropout = nn.Dropout(config.hidden_dropout_prob) |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# full name to abbreviation here: https://gist.github.com/mshafrir/2646763 | |
ste_to_reg = { | |
'AA': 'Other', | |
'AE': 'Other', | |
'AP': 'Other', | |
'AK': 'West', | |
'AL': 'South', | |
'AR': 'South', | |
'AS': 'Other', |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# see here https://huggingface.co/docs/datasets/faiss_and_ea.html#adding-a-faiss-index | |
# I loaded my dataset from a Pandas dataframe | |
import pandas as pd | |
df = pd.read_csv("dataset.csv") | |
from transformers import DPRContextEncoder, DPRContextEncoderTokenizerFast | |
import torch | |
torch.set_grad_enabled(False) |
NewerOlder