import gensim
from gensim.models import Word2Vec
import numpy as np
financial_corpus = [
['茅台', '股价', '上涨', '白酒', '板块', '走强'],
['银行', '股', '下跌', '利率', '上调', '影响'],
['科技', '股', '大涨', 'AI', '概念', '活跃'],
['白酒', '板块', '回调', '茅台', '估值', '偏高'],
['新能源', '汽车', '销量', '增长', '利好', '产业链'],
]
model = Word2Vec(
sentences=financial_corpus,
vector_size=100,
window=5,
min_count=1,
workers=4,
sg=1
)
print("与'茅台'最相似的词:")
for word, sim in model.wv.most_similar('茅台', topn=3):
print(f" {word}: {sim:.3f}")
result = model.wv.most_similar(
positive=['科技', '白酒'],
negative=['茅台']
)
print(f"\n科技 - 茅台 + 白酒 ≈ {result[0][0]}")
model.save('financial_word2vec.model')
maotai_vec = model.wv['茅台']