This commit is contained in:
2025-06-30 14:19:58 -04:00
parent 21b7ccb794
commit c8dbef2c0f
10 changed files with 96383 additions and 48 deletions

View File

@@ -1,6 +1,9 @@
import numpy as np
import json
# Load the reference embedding array from disk.
# NOTE(review): `datum` is bound twice in this view, so the later load from
# 'dump_so400m.npy' replaces the earlier one. This looks like the old and new
# sides of a diff shown together — confirm which load is intended.
datum = np.load('dump.npz.npy')
import numpy as np
#datum = np.load('dump.npz.npy')
datum = np.load('dump_so400m.npy')
with open('dump.json','r') as rr:
@@ -29,25 +32,15 @@ def cosine_sim(emb_in_1, emb_in_2):
# Compare the embeddings held in emb_dict against the rows of datum and print
# the results.
# NOTE(review): emb_dict and cosine_sim are defined outside this view, and the
# statements following each `for` appear here without indentation — confirm
# the loop bodies against the real file before relying on these notes.
# Stack the values of emb_dict into a single array; the keys are dropped here.
arr_in_deepstream = np.asarray([y for _,y in emb_dict.items()])
# Divide each row of datum by its own L2 norm
# (assumes datum is 2-D — TODO confirm).
normed = np.divide(datum.T, np.linalg.norm(datum, axis=1)).T
print('_________________________')
# Number of entries on each side of the comparison.
print(len(emb_dict))
print(len(datum))
# Each key of emb_dict is used directly as an index into datum.
# NOTE(review): verify the keys are valid integer indices for datum.
for fr, emb in emb_dict.items():
# emb1 / emb2 hold the norms of the two vectors; no visible line reads them.
emb1 = np.linalg.norm(emb)
emb2 = np.linalg.norm(datum[fr])
# print( cosine_sim(emb, datum[fr]))
print( cosine_sim(emb, datum[fr]))
print('Deepstream and Actual norm')
# For each row of arr_in_deepstream, print the largest dot product against any
# normalized row of datum. arr_in_deepstream is not normalized in this block,
# so this is a cosine similarity only if its rows are already unit-length
# — TODO confirm.
print(np.max(np.dot(arr_in_deepstream, normed.T),axis=1))
print('_________________________')
# This loop has no effect as shown: its only statement is `pass`.
for dat in datum:
# print(cosine_sim(dat, datum[0]))
pass
#print(cosine_sim(datum[fr], datum[fr+1]))
#print(cosine_sim(emb_dict[fr], emb_dict[fr+1]))