Transformers: How to use linhphanff/phobert-base-v2-flash-attention with the Transformers library:
# Two ways of loading the same checkpoint with the Transformers library.
from transformers import AutoModel, AutoTokenizer, pipeline

# Hub identifier shared by both loading options below.
_CHECKPOINT = "linhphanff/phobert-base-v2-flash-attention"

# Option 1: use a pipeline as a high-level helper.
pipe = pipeline("feature-extraction", model=_CHECKPOINT)

# Option 2: load the tokenizer and the model directly.
tokenizer = AutoTokenizer.from_pretrained(_CHECKPOINT)
model = AutoModel.from_pretrained(_CHECKPOINT)