File size: 736 Bytes
33b10b6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
from api.calc_cosine_similarity import find_cosine_similarity, find_embedding , find_relevant_file_paths
import os
import pickle
# Build the title embeddings once and cache them on disk in 'embeddings.pkl'.
# If that file already exists, nothing is recomputed.
# NOTE(review): in the cached case the pickle is not read back, so
# embeddings_titles stays an empty list -- confirm no importer relies on it.
embeddings_titles = []
if not os.path.exists('embeddings.pkl'):
    # One title per line of titles.txt, with surrounding whitespace (including
    # the trailing newline) stripped. Blank lines are kept as empty titles, so
    # list positions follow the line order of the file.
    # The encoding is explicit so decoding does not depend on the platform's
    # locale default.
    with open('titles.txt', 'r', encoding='utf-8') as file:
        titles = [line.strip() for line in file]
    print("Created a list of titles")

    # find_embedding (from api.calc_cosine_similarity) receives the whole list
    # of titles in a single call.
    embeddings_titles = find_embedding(titles)

    # Persist the titles together with their embeddings so later runs can skip
    # the computation above.
    data = {
        'sentences': titles,
        'embeddings': embeddings_titles,
    }
    with open('embeddings.pkl', 'wb') as f:
        pickle.dump(data, f)