NLL interpretation tool sets
Interpret huggingface tokenizer
from transformers import AutoTokenizer, AutoModel
# Walkthrough: load a pretrained Hugging Face model and its tokenizer, pull out
# the word-embedding matrix, and explore it with InterpEmbeddingsTokenizer.
# Bare expressions below are notebook-style inspections (their value is only
# displayed when run as notebook cells).

# Checkpoint name shared by the model and the tokenizer so their vocabularies match.
PRETRAINED = "albert-base-v2"
model = AutoModel.from_pretrained(PRETRAINED)
tokenizer = AutoTokenizer.from_pretrained(PRETRAINED)

# Inspect the tokenizer's special-token mapping and the model's embedding module.
tokenizer.special_tokens_map
model.embeddings

# Export the word-embedding weights as a NumPy array. `detach()` drops the
# autograd graph (preferred over the legacy `.data` attribute) and `cpu()` is a
# no-op on CPU while keeping this line working if the model lives on another device.
embedding_matrix = model.embeddings.word_embeddings.weight.detach().cpu().numpy()
embedding_matrix.shape  # presumably (vocab_size, embedding_size) -- confirm for this checkpoint

# Call `.values()`: without the parentheses this only shows the bound method,
# not the special-token strings themselves.
tokenizer.special_tokens_map.values()

# NOTE(review): InterpEmbeddingsTokenizer is not imported in the visible part
# of this file; it must be imported or defined before this point.
interp = InterpEmbeddingsTokenizer(
    embedding_matrix,
    tokenizer=tokenizer,
)
interp.search("wife")