Spaces:

fahmiaziz
/

api-embedding

Running

App Files Files Community

fahmiaziz98 committed on Nov 10

Commit

66f2fb1

1 Parent(s): 95cd425

add model splade-large-doc

Browse files

Files changed (4) hide show

requirements.txt +3 -1
src/config/models.yaml +3 -3
vectordb/milvus_client.py +0 -0
vectordb/utils.py +77 -0

requirements.txt CHANGED Viewed

@@ -1,5 +1,7 @@
 fastapi[standard]==0.116.2
 uvicorn==0.35.0
 torch==2.8.0
 sentence-transformers==5.1.1
 loguru==0.7.3
@@ -8,4 +10,4 @@ pydantic-settings==2.11.0
 pyyaml==6.0.3
 ruff==0.14.3
 pinecone==7.3.0
-ipykernel==7.1.0

 fastapi[standard]==0.116.2
 uvicorn==0.35.0
+numpy==2.0.2
+scipy==1.16.3
 torch==2.8.0
 sentence-transformers==5.1.1
 loguru==0.7.3
 pyyaml==6.0.3
 ruff==0.14.3
 pinecone==7.3.0
+ipykernel==7.1.0

src/config/models.yaml CHANGED Viewed

@@ -7,8 +7,8 @@ models:
     name: "google/embeddinggemma-300M"
     type: "embeddings"
-  splade-pp-v2:
-    name: "prithivida/Splade_PP_en_v2"
     type: "sparse-embeddings"
   splade-large-query:
@@ -17,4 +17,4 @@ models:
   bge-v2-m3:
     name: "BAAI/bge-reranker-v2-m3"
-    type: "rerank"

     name: "google/embeddinggemma-300M"
     type: "embeddings"
+  splade-large-doc:
+    name: "naver/efficient-splade-VI-BT-large-doc"
     type: "sparse-embeddings"
   splade-large-query:
   bge-v2-m3:
     name: "BAAI/bge-reranker-v2-m3"
+    type: "rerank"

vectordb/milvus_client.py ADDED Viewed

File without changes

vectordb/utils.py ADDED Viewed

	@@ -0,0 +1,77 @@

+import numpy as np
+from scipy.sparse import csr_matrix
+from typing import Dict, List
+def convert_sparse_to_csr(sparse_dict: Dict[str, List]) -> csr_matrix:
+    """
+    Convert a single sparse embedding to a one-row scipy CSR matrix.
+
+    API format: {"indices": [10, 25, 42], "values": [0.85, 0.62, 0.91]}
+    Milvus format: scipy.sparse.csr_matrix with shape (1, max_dimension)
+
+    The matrix width is derived from the data: largest index + 1, or 1
+    when 'indices' is empty.
+
+    Args:
+        sparse_dict: Dictionary with 'indices' (column positions) and
+            'values' (the entries stored at those positions).
+
+    Returns:
+        scipy CSR matrix with shape (1, max(indices) + 1), or (1, 1) when
+        there are no indices.
+
+    Raises:
+        KeyError: If 'indices' or 'values' is missing from sparse_dict.
+    """
+    indices = sparse_dict["indices"]
+    values = sparse_dict["values"]
+    # NOTE(review): the lengths of 'indices' and 'values' are not compared
+    # here; any mismatch is left to csr_matrix to reject.
+    # Width is just large enough to hold the largest index; 1 if empty.
+    max_dim = max(indices) + 1 if indices else 1
+    # Create CSR matrix
+    # Shape: (1, max_dim) because this is a single vector
+    row_indices = [0] * len(indices)  # Every entry goes in row 0
+    col_indices = indices
+    sparse_matrix = csr_matrix(
+        (values, (row_indices, col_indices)),
+        shape=(1, max_dim)
+    )
+    return sparse_matrix
+def batch_convert_sparse_to_csr(sparse_list: List[Dict[str, List]]) -> csr_matrix:
+    """
+    Convert a batch of sparse embeddings to a single CSR matrix.
+
+    Each dict in sparse_list becomes one row, in input order. The matrix
+    width is the largest index found across the whole batch plus one.
+
+    Args:
+        sparse_list: List of sparse dicts, each with 'indices' and 'values'.
+
+    Returns:
+        scipy CSR matrix with shape (batch_size, max_dim). An empty
+        sparse_list yields an empty matrix of shape (0, 0). If no dict in
+        the batch has any indices, max_dim falls back to 30000.
+
+    Raises:
+        KeyError: If any dict lacks 'indices' or 'values'.
+    """
+    if not sparse_list:
+        return csr_matrix((0, 0))
+    # First pass: find the widest row so all rows share one column count.
+    max_dim = 0
+    for sparse_dict in sparse_list:
+        if sparse_dict["indices"]:
+            max_dim = max(max_dim, max(sparse_dict["indices"]) + 1)
+    # NOTE(review): this fallback differs from convert_sparse_to_csr, which
+    # uses a width of 1 for an empty vector - confirm which one is intended.
+    if max_dim == 0:
+        max_dim = 30000  # Default vocab size for SPLADE
+    # Build row indices, column indices, and values
+    row_indices = []
+    col_indices = []
+    values = []
+    for row_idx, sparse_dict in enumerate(sparse_list):
+        indices = sparse_dict["indices"]
+        vals = sparse_dict["values"]
+        # One row-index entry per stored value of this embedding.
+        row_indices.extend([row_idx] * len(indices))
+        col_indices.extend(indices)
+        values.extend(vals)
+    # Create CSR matrix
+    sparse_matrix = csr_matrix(
+        (values, (row_indices, col_indices)),
+        shape=(len(sparse_list), max_dim)
+    )
+    return sparse_matrix