I execte doc2vec model for text similarity my code and not obtain reslt
it = LabeledLineSentence(datafiles, labels1)
model = gensim.models.Doc2Vec(vector_size=300, min_count=0, alpha=0.025, min_alpha=0.025)
model.build_vocab(it)
#training of model
for epoch in range(100):
print ('iteration '+str(epoch+1))
model.train(it,total_examples=model.corpus_count,
epochs=model.epochs)
model.alpha -= 0.002
model.min_alpha = model.alpha
#saving the created model
model.save('doc2vec.model')
print ("model saved")
#loading the model
d2v_model = gensim.models.doc2vec.Doc2Vec.load('doc2vec.model')
#start testing
seed_text = "consider illegal immoral plagiarism do various"
tokens1 = seed_text.lower().split()
vector1 = d2v_model.infer_vector(tokens1)
#to get most similar document with similarity scores using document-index
most_similar = d2v_model.docvecs.most_similar(positive = [vector1] )
# output_sentences(most_similar)
print(u'%s %s: %s\n' % ("Most", most_similar[0][1], data[int(most_similar[0][0])]))
It output
Most 0.14691241085529327: M
why not print data bt only M what mean , what can i do to solve the problem Regards