VinceItsMe
/

MyFirstModel

Text Classification

sentence-transformers

Model card Files Files and versions Community

MyFirstModel / newtest.py

vincenttruum

test

043aa62 over 1 year ago

1.37 kB

	from datasets import load_dataset
	from sentence_transformers.losses import CosineSimilarityLoss

	from setfit import SetFitModel, SetFitTrainer, sample_dataset


	# Load a dataset from the Hugging Face Hub
	dataset = load_dataset("sst2")

	# Simulate the few-shot regime by sampling 8 examples per class
	train_dataset = sample_dataset(dataset["train"], label_column="label", num_samples=8)
	eval_dataset = dataset["validation"]

	# Load a SetFit model from Hub
	model = SetFitModel.from_pretrained("sentence-transformers/paraphrase-mpnet-base-v2")

	# Create trainer
	trainer = SetFitTrainer(
	model=model,
	train_dataset=train_dataset,
	eval_dataset=eval_dataset,
	loss_class=CosineSimilarityLoss,
	metric="accuracy",
	batch_size=16,
	num_iterations=20, # The number of text pairs to generate for contrastive learning
	num_epochs=1, # The number of epochs to use for contrastive learning
	column_mapping={"sentence": "text", "label": "label"} # Map dataset columns to text/label expected by trainer
	)

	# Train and evaluate
	trainer.train()
	metrics = trainer.evaluate()

	# Push model to the Hub
	trainer.push_to_hub("my-awesome-setfit-model")

	# Download from Hub and run inference
	model = SetFitModel.from_pretrained("lewtun/my-awesome-setfit-model")
	# Run inference
	preds = model(["i loved the spiderman movie!", "pineapple on pizza is the worst 🤮"])