
代码如下:
import faiss
import numpy as np
from transformers import AutoTokenizer, AutoModel
# Load the pretrained tokenizer and model for the checkpoint named in
# `model_name`, using the `transformers` Auto* factory classes.
# NOTE(review): this step was originally described as loading
# "text2vec-large-chinese", but the checkpoint actually requested here is
# "bert-base-chinese" — confirm which model is intended.
model_name = "bert-base-chinese"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModel.from_pretrained(model_name)
# 假设您有两个字符串s1和s2
s1 = "北京是中国的...