Skip to content

Instantly share code, notes, and snippets.

@davidmezzetti
Created October 20, 2021 15:47
Show Gist options
  • Save davidmezzetti/c213cd9b8dd4aadb180b3bb1e3cf6c30 to your computer and use it in GitHub Desktop.
Save davidmezzetti/c213cd9b8dd4aadb180b3bb1e3cf6c30 to your computer and use it in GitHub Desktop.
import time
from txtai.pipeline import Labels
# Build one Labels pipeline per model type. The names below (tflabels, thlabels,
# sklabels) are the ones the timing code reads.

# Emotion names in class-index order; enumerate() turns them into the
# {index: name} mapping assigned to each model config below.
emotions = ("sadness", "joy", "love", "anger", "fear", "surprise")

# Pipeline wrapping whatever train(...) returns for the xtremedistil checkpoint.
# NOTE(review): dynamic=False presumably selects a fixed-label classifier
# rather than zero-shot classification - confirm against the txtai Labels docs.
trained = train("microsoft/xtremedistil-l6-h384-uncased", ds["train"], logging_steps=2000)
tflabels = Labels(trained, dynamic=False)

# Pipeline wrapping an existing (model, tokenizer) pair; the label names are
# attached to the model config explicitly.
thlabels = Labels((model, tokenizer), dynamic=False)
thlabels.pipeline.model.config.id2label = dict(enumerate(emotions))

# Pipeline wrapping (skmodel, tokenize). Note this passes `tokenize`, not the
# `tokenizer` used above. Each config receives its own dict instance.
sklabels = Labels((skmodel, tokenize), dynamic=False)
sklabels.pipeline.model.config.id2label = dict(enumerate(emotions))
# Time each Labels pipeline over the same test inputs and print the elapsed
# seconds for each one.
inputs = ds["test"]["text"]
print(f"Testing speed of {len(inputs)} items")

# (description, pipeline, extra keyword arguments for the call), in run order.
benchmarks = (
    ("Transformers", tflabels, {}),
    ("PyTorch", thlabels, {}),
    # Only this pipeline is called with multilabel=None.
    # NOTE(review): per the txtai Labels docs, None appears to return the model
    # outputs without applying an activation function - confirm.
    ("TF-IDF + Logistic Regression", sklabels, {"multilabel": None}),
)

for description, pipeline, kwargs in benchmarks:
    # perf_counter() is a monotonic, high-resolution clock intended for
    # measuring durations; time.time() can jump if the system clock changes.
    start = time.perf_counter()
    pipeline(inputs, **kwargs)
    print(description, "time =", time.perf_counter() - start)
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment