File size: 461 Bytes
d2237d8
 
 
9dcc0d8
 
 
d2237d8
 
 
9dcc0d8
 
 
d2237d8
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
import os
from transformers import AutoTokenizer, AutoModelForTokenClassification, pipeline

# Directory used to store downloaded tokenizer/model files.
CACHE_DIR = "/tmp/hf_cache"

# NOTE: this assignment runs after `transformers` has already been imported
# above. The library resolves its default cache location at import time, so
# the variable alone does not redirect the downloads below; the cache
# directory is therefore also passed explicitly via `cache_dir`. The
# assignment is kept so anything else that reads the variable still sees it.
os.environ["TRANSFORMERS_CACHE"] = CACHE_DIR


# Access token read from the environment; None when HF_TOKEN is not set.
HF_TOKEN = os.getenv("HF_TOKEN")
# Hub repository id of the token-classification (NER) checkpoint to load.
MODEL_ID = "TypicaAI/magbert-ner"

# Load tokenizer and model from the same checkpoint, caching under CACHE_DIR.
tokenizer = AutoTokenizer.from_pretrained(
    MODEL_ID, token=HF_TOKEN, cache_dir=CACHE_DIR
)
model = AutoModelForTokenClassification.from_pretrained(
    MODEL_ID, token=HF_TOKEN, cache_dir=CACHE_DIR
)


# Module-level NER pipeline built from the objects above.
# aggregation_strategy="first" asks the pipeline to merge sub-word tokens
# into word-level entities (see the pipeline documentation for tag selection).
ner_pipeline = pipeline(
    "ner",
    model=model,
    tokenizer=tokenizer,
    aggregation_strategy="first",
)