Lavorare con Hugging Face
Jacob H. Marquez
Lead Data Engineer
from transformers import pipeline
my_pipeline = pipeline(
"text-classification",
model="distilbert-base-uncased-finetuned-sst-2-english"))
print(my_pipeline("Wi-Fi is slower than a snail today!"))
[{'label': 'NEGATIVE', 'score': 0.99}]
$$
$$

$$
from transformers import AutoModelForSequenceClassification# Scarica un modello pre-addestrato di classificazione del testo model = AutoModelForSequenceClassification.from_pretrained( "distilbert-base-uncased-finetuned-sst-2-english" )
$$
from transformers import AutoTokenizer# Recupera il tokenizer abbinato al modello tokenizer = AutoTokenizer.from_pretrained( "distilbert-base-uncased-finetuned-sst-2-english" )
$$
tokenizer = AutoTokenizer.from_pretrained("distilbert-base-uncased")# Tokenizza il testo di input tokens = tokenizer.tokenize("AI: Helping robots think and humans overthink:)") print(tokens)
['ai', ':', 'helping', 'robots', 'think', 'and',
'humans', 'over', '##thi', '##nk', ':', ')']
Il nostro modello (distilbert-base-uncased):
['ai', ':', 'helping', 'robots', 'think', 'and', 'humans', 'over', '##thi',
'##nk', ':', ')']
Tokenizer BERT-Base-Cased:
['AI', ':', 'Help', '##ing', 'robots', 'think', 'and', 'humans', 'over',
'##thin', '##k', ':', ')']
from transformers import AutoModelForSequenceClassification, AutoTokenizer, pipeline# Scarica il modello e il tokenizer my_model = AutoModelForSequenceClassification.from_pretrained( "distilbert-base-uncased-finetuned-sst-2-english") my_tokenizer = AutoTokenizer.from_pretrained( "distilbert-base-uncased-finetuned-sst-2-english")# Crea la pipeline personalizzata my_pipeline = pipeline( task="sentiment-analysis", model=my_model, tokenizer=my_tokenizer)
$$
🔧 Usale per più controllo e personalizzazione
📝 Preprocessing del testo: pulisci e tokenizza per casi d'uso specifici
$$

Lavorare con Hugging Face