VinceItsMe
/

MyFirstModel

Text Classification

sentence-transformers

Model card Files Files and versions Community

vincenttruum commited on Jan 23, 2023

Commit

043aa62

•

1 Parent(s): 7820bb0

test

Files changed (1) hide show

newtest.py +39 -2

newtest.py CHANGED Viewed

@@ -1,3 +1,40 @@
-from datasets import load_dataset,concatenate_datasets
-from setfit import SetFitModel, SetFitTrainer
 from sentence_transformers.losses import CosineSimilarityLoss

+from datasets import load_dataset
 from sentence_transformers.losses import CosineSimilarityLoss
+from setfit import SetFitModel, SetFitTrainer, sample_dataset
+# Load a dataset from the Hugging Face Hub
+dataset = load_dataset("sst2")
+# Simulate the few-shot regime by sampling 8 examples per class
+train_dataset = sample_dataset(dataset["train"], label_column="label", num_samples=8)
+eval_dataset = dataset["validation"]
+# Load a SetFit model from Hub
+model = SetFitModel.from_pretrained("sentence-transformers/paraphrase-mpnet-base-v2")
+# Create trainer
+trainer = SetFitTrainer(
+    model=model,
+    train_dataset=train_dataset,
+    eval_dataset=eval_dataset,
+    loss_class=CosineSimilarityLoss,
+    metric="accuracy",
+    batch_size=16,
+    num_iterations=20, # The number of text pairs to generate for contrastive learning
+    num_epochs=1, # The number of epochs to use for contrastive learning
+    column_mapping={"sentence": "text", "label": "label"} # Map dataset columns to text/label expected by trainer
+)
+# Train and evaluate
+trainer.train()
+metrics = trainer.evaluate()
+# Push model to the Hub
+trainer.push_to_hub("my-awesome-setfit-model")
+# Download from Hub and run inference
+model = SetFitModel.from_pretrained("lewtun/my-awesome-setfit-model")
+# Run inference
+preds = model(["i loved the spiderman movie!", "pineapple on pizza is the worst 🤮"])