Skip to content

Instantly share code, notes, and snippets.

@aurotripathy
Created March 26, 2026 00:12
Show Gist options
  • Select an option

  • Save aurotripathy/9fadd8da57b9757f4fe703e677d65596 to your computer and use it in GitHub Desktop.

Select an option

Save aurotripathy/9fadd8da57b9757f4fe703e677d65596 to your computer and use it in GitHub Desktop.
# https://qwen.ai/blog?id=qwen3-vl-embedding
from pudb import set_trace
from furiosa_llm import LLM, PoolingParams
import numpy as np
import torch
queries = ["A woman playing with her dog on a beach at sunset.",
"Pet owner training dog outdoors near water.",
"Woman surfing on waves during a sunny day.",
"City skyline view from a high-rise building at night.",
]
documents = ["A woman playing with her dog on a beach at sunrise.",
"Dog owner training dog outdoors near ocean.",
"Woman surfing on waves during a rainy day.",
"City skyline view from a skyscrapers at day.",
]
llm = LLM("furiosa-ai/Qwen3-Embedding-8B", task='embed')
q_embeddings = llm.embed(queries)
doc_embeddings = llm.embed(documents)
q_array = torch.as_tensor([q_embeddings[i].outputs.embedding for i in range(len(queries))])
doc_array = torch.as_tensor([doc_embeddings[i].outputs.embedding for i in range(len(documents))])
# Compute similarity scores between query embeddings and document embeddings
similarity_scores = q_array @ doc_array.T
set_trace()
# Print out the similarity scores in a list format
print(similarity_scores.tolist())
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment