Quintino Fernandes committed on
Commit
a988661
·
1 Parent(s): fce85f3

Same similarity problem

Browse files
database/query_processor.py CHANGED
@@ -118,7 +118,7 @@ class QueryProcessor:
118
  print("Starting first summary generation")
119
  embeddings = self.embedding_model.encode(sentences)
120
  print("Embeddings generated first summary")
121
- similarity_matrix = self.embedding_model.similarity(embeddings, embeddings).numpy
122
  centrality_scores = degree_centrality_scores(similarity_matrix, threshold=None)
123
 
124
  top_indices = np.argsort(-centrality_scores)[:10]
 
118
  print("Starting first summary generation")
119
  embeddings = self.embedding_model.encode(sentences)
120
  print("Embeddings generated first summary")
121
+ similarity_matrix = np.dot(embeddings, embeddings.T) / (np.linalg.norm(embeddings, axis=1, keepdims=True) * np.linalg.norm(embeddings, axis=1, keepdims=True).T)
122
  centrality_scores = degree_centrality_scores(similarity_matrix, threshold=None)
123
 
124
  top_indices = np.argsort(-centrality_scores)[:10]
models/embedding.py CHANGED
@@ -7,7 +7,4 @@ class EmbeddingModel:
7
  self.model = SentenceTransformer("paraphrase-multilingual-MiniLM-L12-v2")
8
 
9
  def encode(self, text: str):
10
- return self.model.encode(text, device=self.device)
11
-
12
- def similarity(self, embeddings):
13
- return self.model.similarity(embeddings, embeddings)
 
7
  self.model = SentenceTransformer("paraphrase-multilingual-MiniLM-L12-v2")
8
 
9
  def encode(self, text: str):
10
+ return self.model.encode(text, device=self.device)