You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

LlavaInteractiveModeExecute.cs 5.5 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129
  1. using System.Text.RegularExpressions;
  2. using LLama.Batched;
  3. using LLama.Common;
  4. using Spectre.Console;
  5. using LLama.Abstractions;
  6. using LLama.Native;
  namespace LLama.Examples.Examples
  {
      /// <summary>
      /// Console example that chats with a LLaVA model using both image and text as input.
      /// Inference is performed through an <see cref="InteractiveExecutor"/>.
      /// </summary>
      public class LlavaInteractiveModeExecute
      {
          // Matches an image reference such as {c:/image.jpg}; capture group 1 is the text between the braces.
          private static readonly Regex ImageReference = new Regex("{([^}]*)}");

          /// <summary>
          /// Loads the model and the multi-modal projector named by <c>UserSettings</c>, sends an initial
          /// "describe this image" prompt and then loops: stream the model's answer, read the next user
          /// prompt, repeat. The loop ends when the user enters <c>/exit</c> or console input is closed.
          /// </summary>
          /// <remarks>
          /// Any <c>{path}</c> found in a prompt is treated as an image file. If an image cannot be read,
          /// the error is reported and the user is asked for a new prompt; no inference is run for the
          /// failed prompt.
          /// </remarks>
          /// <returns>A task that completes when the chat loop ends.</returns>
          public static async Task Run()
          {
              string multiModalProj = UserSettings.GetMMProjPath();
              string modelPath = UserSettings.GetModelPath();
              string modelImage = UserSettings.GetImagePath();
              const int maxTokens = 1024;

              // "{{{x}}}" renders as "{<path>}", i.e. the image-reference syntax parsed below.
              var prompt = $"{{{modelImage}}}\nUSER:\nProvide a full description of the image.\nASSISTANT:\n";

              var parameters = new ModelParams(modelPath);
              using var model = LLamaWeights.LoadFromFile(parameters);
              using var context = model.CreateContext(parameters);

              // Llava Init
              using var clipModel = LLavaWeights.LoadFromFile(multiModalProj);
              var ex = new InteractiveExecutor(context, clipModel);

              Console.ForegroundColor = ConsoleColor.Yellow;
              Console.WriteLine("The executor has been enabled. In this example, the prompt is printed, the maximum tokens is set to {0} and the context size is {1}.", maxTokens, parameters.ContextSize);
              Console.WriteLine("To send an image, enter its filename in curly braces, like this {c:/image.jpg}.");

              var inferenceParams = new InferenceParams() { Temperature = 0.1f, AntiPrompts = new List<string> { "\nUSER:" }, MaxTokens = maxTokens };

              while (true)
              {
                  // Run the regex once per turn; Count forces full evaluation against the current prompt.
                  var references = ImageReference.Matches(prompt);
                  var readyToInfer = true;

                  if (references.Count > 0)
                  {
                      var imagePaths = references.Select(m => m.Groups[1].Value).ToArray();

                      if (TryLoadImages(imagePaths, out var imageBytes))
                      {
                          // When the prompt contains images we clear KV_CACHE to restart the conversation.
                          ex.Context.NativeHandle.KvCacheRemove(LLamaSeqId.Zero, -1, -1);

                          // The first image reference becomes the <image> tag; the remaining ones are removed.
                          var index = 0;
                          foreach (var reference in references.Select(m => m.Value).ToArray())
                          {
                              prompt = prompt.Replace(reference, index++ == 0 ? "<image>" : "");
                          }

                          Console.ForegroundColor = ConsoleColor.Yellow;
                          Console.WriteLine($"Here are the images, that are sent to the chat model in addition to your message.");
                          Console.WriteLine();

                          foreach (var bytes in imageBytes)
                          {
                              var consoleImage = new CanvasImage(bytes) { MaxWidth = 50 };
                              AnsiConsole.Write(consoleImage);
                          }

                          Console.WriteLine();
                          Console.ForegroundColor = ConsoleColor.Yellow;
                          Console.WriteLine($"The images were scaled down for the console only, the model gets full versions.");
                          Console.WriteLine($"Write /exit or press Ctrl+c to return to main menu.");
                          Console.WriteLine();

                          // Initialize images in the executor, reusing the bytes already read
                          // instead of hitting the disk a second time.
                          foreach (var bytes in imageBytes)
                          {
                              ex.Images.Add(bytes);
                          }
                      }
                      else
                      {
                          // The error was already reported; skip inference and ask for a new prompt.
                          readyToInfer = false;
                      }
                  }

                  if (readyToInfer)
                  {
                      Console.ForegroundColor = ConsoleColor.White;
                      await foreach (var text in ex.InferAsync(prompt, inferenceParams))
                      {
                          Console.Write(text);
                      }
                      Console.Write(" ");
                  }

                  Console.ForegroundColor = ConsoleColor.Green;
                  prompt = Console.ReadLine();
                  Console.WriteLine();

                  // Let the user finish with /exit; a null line means console input was closed.
                  if (prompt is null || prompt.Equals("/exit", StringComparison.OrdinalIgnoreCase))
                  {
                      break;
                  }
              }
          }

          /// <summary>
          /// Reads every file in <paramref name="imagePaths"/> into memory.
          /// </summary>
          /// <param name="imagePaths">Paths extracted from the prompt's <c>{...}</c> references.</param>
          /// <param name="imageBytes">
          /// On success, the file contents in the same order as <paramref name="imagePaths"/>;
          /// on failure, an empty array.
          /// </param>
          /// <returns>
          /// <c>true</c> when all files were read; <c>false</c> when any read failed, in which case the
          /// error has been written to the console.
          /// </returns>
          private static bool TryLoadImages(IReadOnlyList<string> imagePaths, out byte[][] imageBytes)
          {
              try
              {
                  imageBytes = imagePaths.Select(File.ReadAllBytes).ToArray();
                  return true;
              }
              // Besides IOException, File.ReadAllBytes rejects empty/invalid paths (ArgumentException,
              // NotSupportedException) and unreadable files (UnauthorizedAccessException); all of these
              // are user-input problems here, not reasons to crash the example.
              catch (Exception exception) when (exception is IOException
                                                || exception is UnauthorizedAccessException
                                                || exception is ArgumentException
                                                || exception is NotSupportedException)
              {
                  imageBytes = Array.Empty<byte[]>();

                  Console.ForegroundColor = ConsoleColor.Red;
                  Console.Write(
                      $"Could not load your {(imagePaths.Count == 1 ? "image" : "images")}: ");
                  Console.WriteLine($"{exception.Message}");
                  Console.ForegroundColor = ConsoleColor.Yellow;
                  Console.WriteLine("Please try again.");
                  return false;
              }
          }
      }
  }