CLIP-Notebook.ipynb
# Scale every embedding row to unit L2 length so that a plain dot product
# between a text row and an image row equals their cosine similarity.
# F.normalize divides by max(norm, eps), so an all-zero row stays zero
# instead of becoming NaN from a 0/0 division.
text_emb = torch.nn.functional.normalize(text_emb, p=2, dim=1)

image_emb = torch.nn.functional.normalize(image_emb, p=2, dim=1)

# cos_sim[i, j] is the cosine similarity between row i of text_emb and
# row j of image_emb. .cpu() is a no-op for tensors already on the CPU and
# is required before .numpy() when the embeddings live on an accelerator.
cos_sim = torch.mm(text_emb, image_emb.T).detach().cpu().numpy()

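Normalize the text and image embeddings to unit vectors, then matrix-multiply them to get the cosine similarity between every text–image pair.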