Update README.md
README.md CHANGED

````diff
@@ -30,7 +30,6 @@ import mlx.core as mx
 
 model, tokenizer = load("mlx-community/embeddinggemma-300m-qat-q4_0-unquantized-bf16")
 
-
 # For text embedding
 sentences = [
     "task: sentence similarity | query: Nothing really matters.",
@@ -43,10 +42,15 @@ encoded_input = tokenizer(sentences, padding=True, truncation=True, return_tenso
 # Compute token embeddings
 input_ids = encoded_input['input_ids']
 attention_mask = encoded_input['attention_mask']
-
+output = model(input_ids, attention_mask)
+
+embeddings = output.text_embeds # Normalized embeddings
 
-
-
+# Compute dot product between normalized embeddings
+similarity_matrix = mx.matmul(embeddings, embeddings.T)
+
+print("Similarity matrix between texts:")
+print(similarity_matrix)
 
 
 # You can use these task-specific prefixes for different tasks
@@ -66,5 +70,4 @@ task_prefixes = {
     "document": "title: none | text: "
 }
 
-
 ```
````
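For context on what the added lines compute: the README takes `output.text_embeds`, which it notes are already normalized, so the dot product `mx.matmul(embeddings, embeddings.T)` yields a cosine-similarity matrix over the input sentences. The sketch below reproduces just that step on dummy vectors; the dummy data and the manual normalization are illustrative assumptions, not part of the model's actual output.

```python
import mlx.core as mx

# Dummy stand-ins for sentence embeddings (illustrative only; the README
# gets these from output.text_embeds, which is already normalized).
embeddings = mx.array([[0.1, 0.3, 0.5],
                       [0.2, 0.1, 0.4]])

# Row-normalize so the dot product equals cosine similarity.
norms = mx.sqrt(mx.sum(embeddings * embeddings, axis=-1, keepdims=True))
embeddings = embeddings / norms

# Same computation the diff adds: pairwise dot products between rows.
similarity_matrix = mx.matmul(embeddings, embeddings.T)
print(similarity_matrix)  # diagonal entries are 1.0 (each sentence vs. itself)
```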