From d1165a77574aa61a4fb880ca191057b899915516 Mon Sep 17 00:00:00 2001 From: Ted Sanders Date: Thu, 19 Jan 2023 10:11:34 -0800 Subject: [PATCH] normalizes averaged embeddings to length 1 --- examples/Embedding_long_inputs.ipynb | 1 + 1 file changed, 1 insertion(+) diff --git a/examples/Embedding_long_inputs.ipynb b/examples/Embedding_long_inputs.ipynb index 33be821..fe6b5fa 100644 --- a/examples/Embedding_long_inputs.ipynb +++ b/examples/Embedding_long_inputs.ipynb @@ -205,6 +205,7 @@ "\n", " if average:\n", " chunk_embeddings = np.average(chunk_embeddings, axis=0, weights=[len(c) for c in chunk_embeddings]).tolist()\n", + " chunk_embeddings = chunk_embeddings / np.linalg.norm(chunk_embeddings) # normalizes length to 1\n", " return chunk_embeddings" ] },