Quintino Fernandes
committed on
Commit
·
a988661
1
Parent(s):
fce85f3
Same similarity problem
Browse files
- database/query_processor.py +1 -1
- models/embedding.py +1 -4
database/query_processor.py
CHANGED
@@ -118,7 +118,7 @@ class QueryProcessor:
|
|
118 |
print("Starting first summary generation")
|
119 |
embeddings = self.embedding_model.encode(sentences)
|
120 |
print("Embeddings generated first summary")
|
121 |
-
similarity_matrix =
|
122 |
centrality_scores = degree_centrality_scores(similarity_matrix, threshold=None)
|
123 |
|
124 |
top_indices = np.argsort(-centrality_scores)[:10]
|
|
|
118 |
print("Starting first summary generation")
|
119 |
embeddings = self.embedding_model.encode(sentences)
|
120 |
print("Embeddings generated first summary")
|
121 |
+
similarity_matrix = np.dot(embeddings, embeddings.T) / (np.linalg.norm(embeddings, axis=1, keepdims=True) * np.linalg.norm(embeddings, axis=1, keepdims=True).T)
|
122 |
centrality_scores = degree_centrality_scores(similarity_matrix, threshold=None)
|
123 |
|
124 |
top_indices = np.argsort(-centrality_scores)[:10]
|
models/embedding.py
CHANGED
@@ -7,7 +7,4 @@ class EmbeddingModel:
|
|
7 |
self.model = SentenceTransformer("paraphrase-multilingual-MiniLM-L12-v2")
|
8 |
|
9 |
def encode(self, text: str):
|
10 |
-
return self.model.encode(text, device=self.device)
|
11 |
-
|
12 |
-
def similarity(self, embeddings):
|
13 |
-
return self.model.similarity(embeddings, embeddings)
|
|
|
7 |
self.model = SentenceTransformer("paraphrase-multilingual-MiniLM-L12-v2")
|
8 |
|
9 |
def encode(self, text: str):
|
10 |
+
return self.model.encode(text, device=self.device)
|
|
|
|
|
|