You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; can include dashes ('-'); and can be up to 35 characters long.

LLamaEmbedderTests.cs 1.4 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758
  1. using LLama.Common;
  2. namespace LLama.Unittest;
  /// <summary>
  /// Tests for <see cref="LLamaEmbedder"/>: checks that the embedding of a word is more
  /// similar to the embedding of a related word than to that of an unrelated word.
  /// </summary>
  public sealed class LLamaEmbedderTests
      : IDisposable
  {
      private readonly LLamaEmbedder _embedder;

      /// <summary>
      /// Loads the model weights from <c>Constants.ModelPath</c> and creates the embedder under test.
      /// </summary>
      public LLamaEmbedderTests()
      {
          var @params = new ModelParams(Constants.ModelPath);

          // The weights are disposed as soon as this constructor returns.
          // NOTE(review): this assumes the embedder does not need `weights` to outlive
          // the constructor - confirm against LLamaEmbedder.
          using var weights = LLamaWeights.LoadFromFile(@params);
          _embedder = new(weights, @params);
      }

      /// <summary>
      /// Releases the embedder created in the constructor.
      /// </summary>
      public void Dispose()
      {
          _embedder.Dispose();
      }

      /// <summary>
      /// Computes the Euclidean length (L2 norm) of a vector.
      /// </summary>
      /// <param name="a">Vector components.</param>
      /// <returns>The square root of the sum of squared components.</returns>
      private static float Magnitude(float[] a)
      {
          return MathF.Sqrt(a.Sum(x => x * x));
      }

      /// <summary>
      /// Scales a vector in place so that its Euclidean length becomes 1.
      /// </summary>
      /// <param name="a">Vector to normalize; its elements are overwritten.</param>
      private static void Normalize(float[] a)
      {
          var mag = Magnitude(a);

          // Dividing by a zero (or NaN) magnitude would silently fill the vector with NaN
          // and make the final comparison fail for a non-obvious reason; fail here instead.
          Assert.True(mag > 0f, "Cannot normalize an embedding whose magnitude is zero or NaN.");

          for (var i = 0; i < a.Length; i++)
          {
              a[i] /= mag;
          }
      }

      /// <summary>
      /// Computes the dot product of two vectors, asserting that they have the same length.
      /// </summary>
      /// <param name="a">First vector.</param>
      /// <param name="b">Second vector.</param>
      /// <returns>The sum of the element-wise products.</returns>
      private static float Dot(float[] a, float[] b)
      {
          Assert.Equal(a.Length, b.Length);
          return a.Zip(b, (x, y) => x * y).Sum();
      }

      /// <summary>
      /// Verifies that "cat" is more similar to "kitten" than to "spoon".
      /// </summary>
      [Fact]
      public void EmbedCompare()
      {
          var cat = _embedder.GetEmbeddings("cat");
          var kitten = _embedder.GetEmbeddings("kitten");
          var spoon = _embedder.GetEmbeddings("spoon");

          Normalize(cat);
          Normalize(kitten);
          Normalize(spoon);

          var close = Dot(cat, kitten);
          var far = Dot(cat, spoon);

          // For unit-length vectors the dot product is the cosine similarity:
          // 1.0 means the same direction, 0.0 means orthogonal (unrelated) and
          // -1.0 means opposite. A larger value therefore means "more similar",
          // so the related pair must score higher than the unrelated pair.
          Assert.True(
              close > far,
              $"Expected similarity of cat/kitten ({close}) to be greater than cat/spoon ({far}).");
      }
  }