# word_2_vec.py (249 B)

import jieba


  2. def process_text(model, text):
  3. words = list(jieba.cut(text)) # 中文分词
  4. vectors = []
  5. for word in words:
  6. vec = model.encode(word) # 用encode方法取向量
  7. vectors.append(vec)
  8. return words, vectors