You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

index.html 60 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
727782779278027812782278327842785278627872788278927902791279227932794279527962797279827992800280128022803280428052806280728082809281028112812281328142815281628172818281928202821282228232824282528262827282828292830283128322833283428352836283728382839284028412842284328442845284628472848284928502851285228532854285528562857285828592860286128622863286428652866286728682869287028712872287328742875287628772878287928802881288228832884288528862887288828892890289128922893289428952896289728982899290029012902290329042905290629072908290929102911
  1. <!doctype html>
  2. <html lang="en" class="no-js">
  3. <head> <!-- Document metadata for the "FAQ" page: charset, viewport, prev/next page links, favicon, title, stylesheets, fonts and the inline storage helpers. -->
  4. <meta charset="utf-8">
  5. <meta name="viewport" content="width=device-width,initial-scale=1">
  6. <link rel="prev" href="../Architecture/"> <!-- Previous page in the documentation sequence. -->
  7. <link rel="next" href="../ContributingGuide/"> <!-- Next page in the documentation sequence. -->
  8. <link rel="icon" href="../assets/images/favicon.png">
  9. <meta name="generator" content="mkdocs-1.4.3, mkdocs-material-9.1.20"> <!-- NOTE(review): the generator stamp suggests this file is build output; presumably fixes belong in the documentation sources rather than here (confirm). -->
  10. <title>FAQ - LLamaSharp Documentation</title>
  11. <link rel="stylesheet" href="../assets/stylesheets/main.eebd395e.min.css">
  12. <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin> <!-- Early connection to the font file host used by the Google Fonts stylesheet below. -->
  13. <link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Roboto:300,300i,400,400i,700,700i%7CRoboto+Mono:400,400i,700,700i&display=fallback">
  14. <style>:root{--md-text-font:"Roboto";--md-code-font:"Roboto Mono"}</style> <!-- Custom properties naming the text and code font families requested above. -->
  15. <script>__md_scope=new URL("..",location),__md_hash=e=>[...e].reduce((e,_)=>(e<<5)-e+_.charCodeAt(0),0),__md_get=(e,_=localStorage,t=__md_scope)=>JSON.parse(_.getItem(t.pathname+"."+e)),__md_set=(e,_,t=localStorage,a=__md_scope)=>{try{t.setItem(a.pathname+"."+e,JSON.stringify(_))}catch(e){}}</script> <!-- Defines four globals. __md_scope: URL of ".." resolved against the current location. __md_hash: folds the characters of a string into an integer with (h<<5)-h+charCode. __md_get: JSON-parses the storage entry keyed by scope pathname + "." + name (localStorage by default). __md_set: JSON-stringifies and stores a value under the same key scheme, silently ignoring any exception thrown while storing. -->
  16. </head>
  17. <body dir="ltr">
  18. <script>var palette=__md_get("__palette");if(palette&&"object"==typeof palette.color)for(var key of Object.keys(palette.color))document.body.setAttribute("data-md-color-"+key,palette.color[key])</script> <!-- Reads the stored "__palette" entry through __md_get (defined in the head script) and, when its color field is an object, copies every key of that object onto body as a data-md-color-KEY attribute. Does nothing when no palette is stored. -->
  19. <input class="md-toggle" data-md-toggle="drawer" type="checkbox" id="__drawer" autocomplete="off">
  20. <input class="md-toggle" data-md-toggle="search" type="checkbox" id="__search" autocomplete="off">
  21. <label class="md-overlay" for="__drawer"></label>
  22. <div data-md-component="skip"> <!-- Skip link: jumps keyboard users past the header and navigation to the page content. NOTE(review): the fragment below is spelled "qustions"; the element carrying that id is not visible in this part of the file, so the href and the id (and presumably the source heading they derive from) must be corrected together, never the href alone. -->
  23. <a href="#frequently-asked-qustions" class="md-skip">
  24. Skip to content
  25. </a>
  26. </div>
  27. <div data-md-component="announce">
  28. </div>
  29. <div data-md-color-scheme="default" data-md-component="outdated" hidden>
  30. </div>
  31. <header class="md-header md-header--shadow" data-md-component="header"> <!-- Page header: logo link, drawer toggle, site title and page topic, search toggle, and the search dialog. -->
  32. <nav class="md-header__inner md-grid" aria-label="Header">
  33. <a href=".." title="LLamaSharp Documentation" class="md-header__button md-logo" aria-label="LLamaSharp Documentation" data-md-component="logo"> <!-- Logo link to the site root; the accessible name comes from aria-label because the only content is an SVG icon. -->
  34. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 8a3 3 0 0 0 3-3 3 3 0 0 0-3-3 3 3 0 0 0-3 3 3 3 0 0 0 3 3m0 3.54C9.64 9.35 6.5 8 3 8v11c3.5 0 6.64 1.35 9 3.54 2.36-2.19 5.5-3.54 9-3.54V8c-3.5 0-6.64 1.35-9 3.54Z"/></svg>
  35. </a>
  36. <label class="md-header__button md-icon" for="__drawer"> <!-- Activating this label toggles the checkbox with id "__drawer". -->
  37. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M3 6h18v2H3V6m0 5h18v2H3v-2m0 5h18v2H3v-2Z"/></svg>
  38. </label>
  39. <div class="md-header__title" data-md-component="header-title"> <!-- Two topic slots: the site name and the current page title ("FAQ"). -->
  40. <div class="md-header__ellipsis">
  41. <div class="md-header__topic">
  42. <span class="md-ellipsis">
  43. LLamaSharp Documentation
  44. </span>
  45. </div>
  46. <div class="md-header__topic" data-md-component="header-topic">
  47. <span class="md-ellipsis">
  48. FAQ
  49. </span>
  50. </div>
  51. </div>
  52. </div>
  53. <label class="md-header__button md-icon" for="__search"> <!-- Activating this label toggles the checkbox with id "__search". -->
  54. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.516 6.516 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5Z"/></svg>
  55. </label>
  56. <div class="md-search" data-md-component="search" role="dialog"> <!-- Search dialog: overlay label, query form, and the result list container. -->
  57. <label class="md-search__overlay" for="__search"></label>
  58. <div class="md-search__inner" role="search">
  59. <form class="md-search__form" name="search">
  60. <input type="text" class="md-search__input" name="query" aria-label="Search" placeholder="Search" autocapitalize="off" autocorrect="off" autocomplete="off" spellcheck="false" data-md-component="search-query" required>
  61. <label class="md-search__icon md-icon" for="__search">
  62. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.516 6.516 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5Z"/></svg>
  63. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11h12Z"/></svg>
  64. </label>
  65. <nav class="md-search__options" aria-label="Search">
  66. <button type="reset" class="md-search__icon md-icon" title="Clear" aria-label="Clear" tabindex="-1"> <!-- Reset button for the search form; tabindex -1 keeps it out of the sequential tab order. -->
  67. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M19 6.41 17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12 19 6.41Z"/></svg>
  68. </button>
  69. </nav>
  70. </form>
  71. <div class="md-search__output">
  72. <div class="md-search__scrollwrap" data-md-scrollfix>
  73. <div class="md-search-result" data-md-component="search-result"> <!-- Result area: a status line plus an initially empty list; presumably both are filled in by the theme script at runtime (script not visible here). -->
  74. <div class="md-search-result__meta">
  75. Initializing search
  76. </div>
  77. <ol class="md-search-result__list" role="presentation"></ol>
  78. </div>
  79. </div>
  80. </div>
  81. </div>
  82. </div>
  83. </nav>
  84. </header>
  85. <div class="md-container" data-md-component="container">
  86. <main class="md-main" data-md-component="main">
  87. <div class="md-main__inner md-grid">
  88. <div class="md-sidebar md-sidebar--primary" data-md-component="sidebar" data-md-type="navigation" >
  89. <div class="md-sidebar__scrollwrap">
  90. <div class="md-sidebar__inner">
  91. <nav class="md-nav md-nav--primary" aria-label="Navigation" data-md-level="0">
  92. <label class="md-nav__title" for="__drawer">
  93. <a href=".." title="LLamaSharp Documentation" class="md-nav__button md-logo" aria-label="LLamaSharp Documentation" data-md-component="logo">
  94. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 8a3 3 0 0 0 3-3 3 3 0 0 0-3-3 3 3 0 0 0-3 3 3 3 0 0 0 3 3m0 3.54C9.64 9.35 6.5 8 3 8v11c3.5 0 6.64 1.35 9 3.54 2.36-2.19 5.5-3.54 9-3.54V8c-3.5 0-6.64 1.35-9 3.54Z"/></svg>
  95. </a>
  96. LLamaSharp Documentation
  97. </label>
  98. <ul class="md-nav__list" data-md-scrollfix>
  99. <li class="md-nav__item">
  100. <a href=".." class="md-nav__link">
  101. Overview
  102. </a>
  103. </li>
  104. <li class="md-nav__item">
  105. <a href="../QuickStart/" class="md-nav__link">
  106. Quick Start
  107. </a>
  108. </li>
  109. <li class="md-nav__item">
  110. <a href="../Architecture/" class="md-nav__link">
  111. Architecture
  112. </a>
  113. </li>
  114. <li class="md-nav__item md-nav__item--active">
  115. <input class="md-nav__toggle md-toggle" type="checkbox" id="__toc">
  116. <label class="md-nav__link md-nav__link--active" for="__toc">
  117. FAQ
  118. <span class="md-nav__icon md-icon"></span>
  119. </label>
  120. <a href="./" class="md-nav__link md-nav__link--active">
  121. FAQ
  122. </a>
  123. <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
  124. <label class="md-nav__title" for="__toc">
  125. <span class="md-nav__icon md-icon"></span>
  126. Table of contents
  127. </label>
  128. <ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
  129. <li class="md-nav__item">
  130. <a href="#why-gpu-is-not-used-when-i-have-installed-cuda" class="md-nav__link">
  131. Why GPU is not used when I have installed CUDA
  132. </a>
  133. </li>
  134. <li class="md-nav__item">
  135. <a href="#why-the-inference-is-slow" class="md-nav__link">
  136. Why the inference is slow
  137. </a>
  138. </li>
  139. <li class="md-nav__item">
  140. <a href="#why-the-program-crashes-before-any-output-is-generated" class="md-nav__link">
  141. Why the program crashes before any output is generated
  142. </a>
  143. </li>
  144. <li class="md-nav__item">
  145. <a href="#why-my-model-is-generating-output-infinitely" class="md-nav__link">
  146. Why my model is generating output infinitely
  147. </a>
  148. </li>
  149. <li class="md-nav__item">
  150. <a href="#how-to-run-llm-with-non-english-languages" class="md-nav__link">
  151. How to run LLM with non-English languages
  152. </a>
  153. </li>
  154. <li class="md-nav__item">
  155. <a href="#pay-attention-to-the-length-of-prompt" class="md-nav__link">
  156. Pay attention to the length of prompt
  157. </a>
  158. </li>
  159. <li class="md-nav__item">
  160. <a href="#choose-models-weight-depending-on-you-task" class="md-nav__link">
  161. Choose models weight depending on you task
  162. </a>
  163. </li>
  164. </ul>
  165. </nav>
  166. </li>
  167. <li class="md-nav__item">
  168. <a href="../ContributingGuide/" class="md-nav__link">
  169. Contributing Guide
  170. </a>
  171. </li>
  172. <li class="md-nav__item md-nav__item--nested">
  173. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_6" >
  174. <label class="md-nav__link" for="__nav_6" id="__nav_6_label" tabindex="0">
  175. Tutorials
  176. <span class="md-nav__icon md-icon"></span>
  177. </label>
  178. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_6_label" aria-expanded="false">
  179. <label class="md-nav__title" for="__nav_6">
  180. <span class="md-nav__icon md-icon"></span>
  181. Tutorials
  182. </label>
  183. <ul class="md-nav__list" data-md-scrollfix>
  184. <li class="md-nav__item">
  185. <a href="../Tutorials/NativeLibraryConfig/" class="md-nav__link">
  186. Customize the native library loading
  187. </a>
  188. </li>
  189. <li class="md-nav__item">
  190. <a href="../Tutorials/Executors/" class="md-nav__link">
  191. Use executors
  192. </a>
  193. </li>
  194. <li class="md-nav__item">
  195. <a href="../Tutorials/ChatSession/" class="md-nav__link">
  196. Use ChatSession
  197. </a>
  198. </li>
  199. <li class="md-nav__item">
  200. <a href="../Tutorials/UnderstandLLamaContext/" class="md-nav__link">
  201. Understand LLamaContext
  202. </a>
  203. </li>
  204. <li class="md-nav__item">
  205. <a href="../Tutorials/GetEmbeddings/" class="md-nav__link">
  206. Get embeddings
  207. </a>
  208. </li>
  209. <li class="md-nav__item">
  210. <a href="../Tutorials/Quantization/" class="md-nav__link">
  211. Quantize the model
  212. </a>
  213. </li>
  214. </ul>
  215. </nav>
  216. </li>
  217. <li class="md-nav__item md-nav__item--nested"> <!-- "Integrations" navigation section: a checkbox-driven collapsible group containing four page links. -->
  218. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_7" >
  219. <label class="md-nav__link" for="__nav_7" id="__nav_7_label" tabindex="0">
  220. Integrations
  221. <span class="md-nav__icon md-icon"></span>
  222. </label>
  223. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_7_label" aria-expanded="false"> <!-- Nested list, labelled by the toggle label above. -->
  224. <label class="md-nav__title" for="__nav_7">
  225. <span class="md-nav__icon md-icon"></span>
  226. Integrations
  227. </label>
  228. <ul class="md-nav__list" data-md-scrollfix>
  229. <li class="md-nav__item">
  230. <a href="../Integrations/semantic-kernel/" class="md-nav__link">
  231. semantic-kernel integration
  232. </a>
  233. </li>
  234. <li class="md-nav__item">
  235. <a href="../Integrations/kernel-memory/" class="md-nav__link">
  236. kernel-memory integration
  237. </a>
  238. </li>
  239. <li class="md-nav__item"> <!-- NOTE(review): the href below ends in ".md" while every sibling link points at a directory URL; this looks like a navigation entry the site generator could not resolve to a built page. Verify the source page exists before changing the link. -->
  240. <a href="../Integrations/BotSharp.md" class="md-nav__link">
  241. BotSharp integration
  242. </a>
  243. </li>
  244. <li class="md-nav__item"> <!-- NOTE(review): same ".md" href pattern as the BotSharp entry; likely an unresolved navigation target (confirm against the documentation sources). -->
  245. <a href="../Integrations/Langchain.md" class="md-nav__link">
  246. Langchain integration
  247. </a>
  248. </li>
  249. </ul>
  250. </nav>
  251. </li>
  252. <li class="md-nav__item md-nav__item--nested">
  253. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_8" >
  254. <label class="md-nav__link" for="__nav_8" id="__nav_8_label" tabindex="0">
  255. Examples
  256. <span class="md-nav__icon md-icon"></span>
  257. </label>
  258. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_8_label" aria-expanded="false">
  259. <label class="md-nav__title" for="__nav_8">
  260. <span class="md-nav__icon md-icon"></span>
  261. Examples
  262. </label>
  263. <ul class="md-nav__list" data-md-scrollfix>
  264. <li class="md-nav__item">
  265. <a href="../Examples/BatchedExecutorFork/" class="md-nav__link">
  266. Batched executor - multi-output to one input
  267. </a>
  268. </li>
  269. <li class="md-nav__item">
  270. <a href="../Examples/BatchedExecutorGuidance/" class="md-nav__link">
  271. Batched executor - basic guidance
  272. </a>
  273. </li>
  274. <li class="md-nav__item">
  275. <a href="../Examples/BatchedExecutorRewind/" class="md-nav__link">
  276. Batched executor - rewinding to an earlier state
  277. </a>
  278. </li>
  279. <li class="md-nav__item">
  280. <a href="../Examples/ChatChineseGB2312/" class="md-nav__link">
  281. Chinese LLM - with GB2312 encoding
  282. </a>
  283. </li>
  284. <li class="md-nav__item">
  285. <a href="../Examples/ChatSessionStripRoleName/" class="md-nav__link">
  286. ChatSession - stripping role names
  287. </a>
  288. </li>
  289. <li class="md-nav__item">
  290. <a href="../Examples/ChatSessionWithHistory/" class="md-nav__link">
  291. ChatSession - with history
  292. </a>
  293. </li>
  294. <li class="md-nav__item">
  295. <a href="../Examples/ChatSessionWithRestart/" class="md-nav__link">
  296. ChatSession - restarting
  297. </a>
  298. </li>
  299. <li class="md-nav__item">
  300. <a href="../Examples/ChatSessionWithRoleName/" class="md-nav__link">
  301. ChatSession - Basic
  302. </a>
  303. </li>
  304. <li class="md-nav__item">
  305. <a href="../Examples/CodingAssistant/" class="md-nav__link">
  306. Coding assistant
  307. </a>
  308. </li>
  309. <li class="md-nav__item">
  310. <a href="../Examples/GetEmbeddings/" class="md-nav__link">
  311. Get embeddings
  312. </a>
  313. </li>
  314. <li class="md-nav__item">
  315. <a href="../Examples/GrammarJsonResponse/" class="md-nav__link">
  316. Grammar - json response
  317. </a>
  318. </li>
  319. <li class="md-nav__item">
  320. <a href="../Examples/InstructModeExecute/" class="md-nav__link">
  321. Instruct executor - basic
  322. </a>
  323. </li>
  324. <li class="md-nav__item">
  325. <a href="../Examples/InteractiveModeExecute/" class="md-nav__link">
  326. Interactive executor - basic
  327. </a>
  328. </li>
  329. <li class="md-nav__item">
  330. <a href="../Examples/KernelMemory/" class="md-nav__link">
  331. Kernel memory integration - basic
  332. </a>
  333. </li>
  334. <li class="md-nav__item">
  335. <a href="../Examples/KernelMemorySaveAndLoad/" class="md-nav__link">
  336. Kernel-memory - save & load
  337. </a>
  338. </li>
  339. <li class="md-nav__item">
  340. <a href="../Examples/LLavaInteractiveModeExecute/" class="md-nav__link">
  341. LLaVA - basic
  342. </a>
  343. </li>
  344. <li class="md-nav__item">
  345. <a href="../Examples/LoadAndSaveSession/" class="md-nav__link">
  346. ChatSession - load & save
  347. </a>
  348. </li>
  349. <li class="md-nav__item">
  350. <a href="../Examples/LoadAndSaveState/" class="md-nav__link">
  351. Executor - save/load state
  352. </a>
  353. </li>
  354. <li class="md-nav__item">
  355. <a href="../Examples/QuantizeModel/" class="md-nav__link">
  356. Quantization
  357. </a>
  358. </li>
  359. <li class="md-nav__item">
  360. <a href="../Examples/SemanticKernelChat/" class="md-nav__link">
  361. Semantic-kernel - chat
  362. </a>
  363. </li>
  364. <li class="md-nav__item">
  365. <a href="../Examples/SemanticKernelMemory/" class="md-nav__link">
  366. Semantic-kernel - with kernel-memory
  367. </a>
  368. </li>
  369. <li class="md-nav__item">
  370. <a href="../Examples/SemanticKernelPrompt/" class="md-nav__link">
  371. Semantic-kernel - basic
  372. </a>
  373. </li>
  374. <li class="md-nav__item">
  375. <a href="../Examples/StatelessModeExecute/" class="md-nav__link">
  376. Stateless executor
  377. </a>
  378. </li>
  379. <li class="md-nav__item">
  380. <a href="../Examples/TalkToYourself/" class="md-nav__link">
  381. Talk to yourself
  382. </a>
  383. </li>
  384. </ul>
  385. </nav>
  386. </li>
  387. <li class="md-nav__item md-nav__item--nested">
  388. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_9" >
  389. <label class="md-nav__link" for="__nav_9" id="__nav_9_label" tabindex="0">
  390. API Reference
  391. <span class="md-nav__icon md-icon"></span>
  392. </label>
  393. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_9_label" aria-expanded="false">
  394. <label class="md-nav__title" for="__nav_9">
  395. <span class="md-nav__icon md-icon"></span>
  396. API Reference
  397. </label>
  398. <ul class="md-nav__list" data-md-scrollfix>
  399. <li class="md-nav__item">
  400. <a href="../xmldocs/" class="md-nav__link">
  401. index
  402. </a>
  403. </li>
  404. <li class="md-nav__item">
  405. <a href="../xmldocs/llama.abstractions.adaptercollection/" class="md-nav__link">
  406. llama.abstractions.adaptercollection
  407. </a>
  408. </li>
  409. <li class="md-nav__item">
  410. <a href="../xmldocs/llama.abstractions.icontextparams/" class="md-nav__link">
  411. llama.abstractions.icontextparams
  412. </a>
  413. </li>
  414. <li class="md-nav__item">
  415. <a href="../xmldocs/llama.abstractions.ihistorytransform/" class="md-nav__link">
  416. llama.abstractions.ihistorytransform
  417. </a>
  418. </li>
  419. <li class="md-nav__item">
  420. <a href="../xmldocs/llama.abstractions.iinferenceparams/" class="md-nav__link">
  421. llama.abstractions.iinferenceparams
  422. </a>
  423. </li>
  424. <li class="md-nav__item">
  425. <a href="../xmldocs/llama.abstractions.illamaexecutor/" class="md-nav__link">
  426. llama.abstractions.illamaexecutor
  427. </a>
  428. </li>
  429. <li class="md-nav__item">
  430. <a href="../xmldocs/llama.abstractions.illamaparams/" class="md-nav__link">
  431. llama.abstractions.illamaparams
  432. </a>
  433. </li>
  434. <li class="md-nav__item">
  435. <a href="../xmldocs/llama.abstractions.imodelparams/" class="md-nav__link">
  436. llama.abstractions.imodelparams
  437. </a>
  438. </li>
  439. <li class="md-nav__item">
  440. <a href="../xmldocs/llama.abstractions.itextstreamtransform/" class="md-nav__link">
  441. llama.abstractions.itextstreamtransform
  442. </a>
  443. </li>
  444. <li class="md-nav__item">
  445. <a href="../xmldocs/llama.abstractions.itexttransform/" class="md-nav__link">
  446. llama.abstractions.itexttransform
  447. </a>
  448. </li>
  449. <li class="md-nav__item">
  450. <a href="../xmldocs/llama.abstractions.loraadapter/" class="md-nav__link">
  451. llama.abstractions.loraadapter
  452. </a>
  453. </li>
  454. <li class="md-nav__item">
  455. <a href="../xmldocs/llama.abstractions.metadataoverride/" class="md-nav__link">
  456. llama.abstractions.metadataoverride
  457. </a>
  458. </li>
  459. <li class="md-nav__item">
  460. <a href="../xmldocs/llama.abstractions.metadataoverrideconverter/" class="md-nav__link">
  461. llama.abstractions.metadataoverrideconverter
  462. </a>
  463. </li>
  464. <li class="md-nav__item">
  465. <a href="../xmldocs/llama.abstractions.tensorsplitscollection/" class="md-nav__link">
  466. llama.abstractions.tensorsplitscollection
  467. </a>
  468. </li>
  469. <li class="md-nav__item">
  470. <a href="../xmldocs/llama.abstractions.tensorsplitscollectionconverter/" class="md-nav__link">
  471. llama.abstractions.tensorsplitscollectionconverter
  472. </a>
  473. </li>
  474. <li class="md-nav__item">
  475. <a href="../xmldocs/llama.antipromptprocessor/" class="md-nav__link">
  476. llama.antipromptprocessor
  477. </a>
  478. </li>
  479. <li class="md-nav__item">
  480. <a href="../xmldocs/llama.batched.alreadypromptedconversationexception/" class="md-nav__link">
  481. llama.batched.alreadypromptedconversationexception
  482. </a>
  483. </li>
  484. <li class="md-nav__item">
  485. <a href="../xmldocs/llama.batched.batchedexecutor/" class="md-nav__link">
  486. llama.batched.batchedexecutor
  487. </a>
  488. </li>
  489. <li class="md-nav__item">
  490. <a href="../xmldocs/llama.batched.cannotforkwhilerequiresinferenceexception/" class="md-nav__link">
  491. llama.batched.cannotforkwhilerequiresinferenceexception
  492. </a>
  493. </li>
  494. <li class="md-nav__item">
  495. <a href="../xmldocs/llama.batched.cannotmodifywhilerequiresinferenceexception/" class="md-nav__link">
  496. llama.batched.cannotmodifywhilerequiresinferenceexception
  497. </a>
  498. </li>
  499. <li class="md-nav__item">
  500. <a href="../xmldocs/llama.batched.cannotsamplerequiresinferenceexception/" class="md-nav__link">
  501. llama.batched.cannotsamplerequiresinferenceexception
  502. </a>
  503. </li>
  504. <li class="md-nav__item">
  505. <a href="../xmldocs/llama.batched.cannotsamplerequirespromptexception/" class="md-nav__link">
  506. llama.batched.cannotsamplerequirespromptexception
  507. </a>
  508. </li>
  509. <li class="md-nav__item">
  510. <a href="../xmldocs/llama.batched.conversation/" class="md-nav__link">
  511. llama.batched.conversation
  512. </a>
  513. </li>
  514. <li class="md-nav__item">
  515. <a href="../xmldocs/llama.batched.conversationextensions/" class="md-nav__link">
  516. llama.batched.conversationextensions
  517. </a>
  518. </li>
  519. <li class="md-nav__item">
  520. <a href="../xmldocs/llama.batched.experimentalbatchedexecutorexception/" class="md-nav__link">
  521. llama.batched.experimentalbatchedexecutorexception
  522. </a>
  523. </li>
  524. <li class="md-nav__item">
  525. <a href="../xmldocs/llama.chatsession-1/" class="md-nav__link">
  526. llama.chatsession-1
  527. </a>
  528. </li>
  529. <li class="md-nav__item">
  530. <a href="../xmldocs/llama.chatsession/" class="md-nav__link">
  531. llama.chatsession
  532. </a>
  533. </li>
  534. <li class="md-nav__item">
  535. <a href="../xmldocs/llama.common.authorrole/" class="md-nav__link">
  536. llama.common.authorrole
  537. </a>
  538. </li>
  539. <li class="md-nav__item">
  540. <a href="../xmldocs/llama.common.chathistory/" class="md-nav__link">
  541. llama.common.chathistory
  542. </a>
  543. </li>
  544. <li class="md-nav__item">
  545. <a href="../xmldocs/llama.common.fixedsizequeue-1/" class="md-nav__link">
  546. llama.common.fixedsizequeue-1
  547. </a>
  548. </li>
  549. <li class="md-nav__item">
  550. <a href="../xmldocs/llama.common.inferenceparams/" class="md-nav__link">
  551. llama.common.inferenceparams
  552. </a>
  553. </li>
  554. <li class="md-nav__item">
  555. <a href="../xmldocs/llama.common.mirostattype/" class="md-nav__link">
  556. llama.common.mirostattype
  557. </a>
  558. </li>
  559. <li class="md-nav__item">
  560. <a href="../xmldocs/llama.common.modelparams/" class="md-nav__link">
  561. llama.common.modelparams
  562. </a>
  563. </li>
  564. <li class="md-nav__item">
  565. <a href="../xmldocs/llama.exceptions.grammarexpectedname/" class="md-nav__link">
  566. llama.exceptions.grammarexpectedname
  567. </a>
  568. </li>
  569. <li class="md-nav__item">
  570. <a href="../xmldocs/llama.exceptions.grammarexpectednext/" class="md-nav__link">
  571. llama.exceptions.grammarexpectednext
  572. </a>
  573. </li>
  574. <li class="md-nav__item">
  575. <a href="../xmldocs/llama.exceptions.grammarexpectedprevious/" class="md-nav__link">
  576. llama.exceptions.grammarexpectedprevious
  577. </a>
  578. </li>
  579. <li class="md-nav__item">
  580. <a href="../xmldocs/llama.exceptions.grammarformatexception/" class="md-nav__link">
  581. llama.exceptions.grammarformatexception
  582. </a>
  583. </li>
  584. <li class="md-nav__item">
  585. <a href="../xmldocs/llama.exceptions.grammarunexpectedcharaltelement/" class="md-nav__link">
  586. llama.exceptions.grammarunexpectedcharaltelement
  587. </a>
  588. </li>
  589. <li class="md-nav__item">
  590. <a href="../xmldocs/llama.exceptions.grammarunexpectedcharrngelement/" class="md-nav__link">
  591. llama.exceptions.grammarunexpectedcharrngelement
  592. </a>
  593. </li>
  594. <li class="md-nav__item">
  595. <a href="../xmldocs/llama.exceptions.grammarunexpectedendelement/" class="md-nav__link">
  596. llama.exceptions.grammarunexpectedendelement
  597. </a>
  598. </li>
  599. <li class="md-nav__item">
  600. <a href="../xmldocs/llama.exceptions.grammarunexpectedendofinput/" class="md-nav__link">
  601. llama.exceptions.grammarunexpectedendofinput
  602. </a>
  603. </li>
  604. <li class="md-nav__item">
  605. <a href="../xmldocs/llama.exceptions.grammarunexpectedhexcharscount/" class="md-nav__link">
  606. llama.exceptions.grammarunexpectedhexcharscount
  607. </a>
  608. </li>
  609. <li class="md-nav__item">
  610. <a href="../xmldocs/llama.exceptions.grammarunknownescapecharacter/" class="md-nav__link">
  611. llama.exceptions.grammarunknownescapecharacter
  612. </a>
  613. </li>
  614. <li class="md-nav__item">
  615. <a href="../xmldocs/llama.exceptions.llamadecodeerror/" class="md-nav__link">
  616. llama.exceptions.llamadecodeerror
  617. </a>
  618. </li>
  619. <li class="md-nav__item">
  620. <a href="../xmldocs/llama.exceptions.loadweightsfailedexception/" class="md-nav__link">
  621. llama.exceptions.loadweightsfailedexception
  622. </a>
  623. </li>
  624. <li class="md-nav__item">
  625. <a href="../xmldocs/llama.exceptions.runtimeerror/" class="md-nav__link">
  626. llama.exceptions.runtimeerror
  627. </a>
  628. </li>
  629. <li class="md-nav__item">
  630. <a href="../xmldocs/llama.extensions.icontextparamsextensions/" class="md-nav__link">
  631. llama.extensions.icontextparamsextensions
  632. </a>
  633. </li>
  634. <li class="md-nav__item">
  635. <a href="../xmldocs/llama.extensions.imodelparamsextensions/" class="md-nav__link">
  636. llama.extensions.imodelparamsextensions
  637. </a>
  638. </li>
  639. <li class="md-nav__item">
  640. <a href="../xmldocs/llama.grammars.grammar/" class="md-nav__link">
  641. llama.grammars.grammar
  642. </a>
  643. </li>
  644. <li class="md-nav__item">
  645. <a href="../xmldocs/llama.grammars.grammarrule/" class="md-nav__link">
  646. llama.grammars.grammarrule
  647. </a>
  648. </li>
  649. <li class="md-nav__item">
  650. <a href="../xmldocs/llama.ichatmodel/" class="md-nav__link">
  651. llama.ichatmodel
  652. </a>
  653. </li>
  654. <li class="md-nav__item">
  655. <a href="../xmldocs/llama.llamacache/" class="md-nav__link">
  656. llama.llamacache
  657. </a>
  658. </li>
  659. <li class="md-nav__item">
  660. <a href="../xmldocs/llama.llamaembedder/" class="md-nav__link">
  661. llama.llamaembedder
  662. </a>
  663. </li>
  664. <li class="md-nav__item">
  665. <a href="../xmldocs/llama.llamamodel/" class="md-nav__link">
  666. llama.llamamodel
  667. </a>
  668. </li>
  669. <li class="md-nav__item">
  670. <a href="../xmldocs/llama.llamamodelv1/" class="md-nav__link">
  671. llama.llamamodelv1
  672. </a>
  673. </li>
  674. <li class="md-nav__item">
  675. <a href="../xmldocs/llama.llamaparams/" class="md-nav__link">
  676. llama.llamaparams
  677. </a>
  678. </li>
  679. <li class="md-nav__item">
  680. <a href="../xmldocs/llama.llamaquantizer/" class="md-nav__link">
  681. llama.llamaquantizer
  682. </a>
  683. </li>
  684. <li class="md-nav__item">
  685. <a href="../xmldocs/llama.llamastate/" class="md-nav__link">
  686. llama.llamastate
  687. </a>
  688. </li>
  689. <li class="md-nav__item">
  690. <a href="../xmldocs/llama.llamatransforms/" class="md-nav__link">
  691. llama.llamatransforms
  692. </a>
  693. </li>
  694. <li class="md-nav__item">
  695. <a href="../xmldocs/llama.llavaweights/" class="md-nav__link">
  696. llama.llavaweights
  697. </a>
  698. </li>
  699. <li class="md-nav__item">
  700. <a href="../xmldocs/llama.native.decoderesult/" class="md-nav__link">
  701. llama.native.decoderesult
  702. </a>
  703. </li>
  704. <li class="md-nav__item">
  705. <a href="../xmldocs/llama.native.ggmltype/" class="md-nav__link">
  706. llama.native.ggmltype
  707. </a>
  708. </li>
  709. <li class="md-nav__item">
  710. <a href="../xmldocs/llama.native.gpusplitmode/" class="md-nav__link">
  711. llama.native.gpusplitmode
  712. </a>
  713. </li>
  714. <li class="md-nav__item">
  715. <a href="../xmldocs/llama.native.llamabatch/" class="md-nav__link">
  716. llama.native.llamabatch
  717. </a>
  718. </li>
  719. <li class="md-nav__item">
  720. <a href="../xmldocs/llama.native.llamabeamsstate/" class="md-nav__link">
  721. llama.native.llamabeamsstate
  722. </a>
  723. </li>
  724. <li class="md-nav__item">
  725. <a href="../xmldocs/llama.native.llamabeamview/" class="md-nav__link">
  726. llama.native.llamabeamview
  727. </a>
  728. </li>
  729. <li class="md-nav__item">
  730. <a href="../xmldocs/llama.native.llamachatmessage/" class="md-nav__link">
  731. llama.native.llamachatmessage
  732. </a>
  733. </li>
  734. <li class="md-nav__item">
  735. <a href="../xmldocs/llama.native.llamacontextparams/" class="md-nav__link">
  736. llama.native.llamacontextparams
  737. </a>
  738. </li>
  739. <li class="md-nav__item">
  740. <a href="../xmldocs/llama.native.llamaftype/" class="md-nav__link">
  741. llama.native.llamaftype
  742. </a>
  743. </li>
  744. <li class="md-nav__item">
  745. <a href="../xmldocs/llama.native.llamagrammarelement/" class="md-nav__link">
  746. llama.native.llamagrammarelement
  747. </a>
  748. </li>
  749. <li class="md-nav__item">
  750. <a href="../xmldocs/llama.native.llamagrammarelementtype/" class="md-nav__link">
  751. llama.native.llamagrammarelementtype
  752. </a>
  753. </li>
  754. <li class="md-nav__item">
  755. <a href="../xmldocs/llama.native.llamakvcacheview/" class="md-nav__link">
  756. llama.native.llamakvcacheview
  757. </a>
  758. </li>
  759. <li class="md-nav__item">
  760. <a href="../xmldocs/llama.native.llamakvcacheviewcell/" class="md-nav__link">
  761. llama.native.llamakvcacheviewcell
  762. </a>
  763. </li>
  764. <li class="md-nav__item">
  765. <a href="../xmldocs/llama.native.llamakvcacheviewsafehandle/" class="md-nav__link">
  766. llama.native.llamakvcacheviewsafehandle
  767. </a>
  768. </li>
  769. <li class="md-nav__item">
  770. <a href="../xmldocs/llama.native.llamaloglevel/" class="md-nav__link">
  771. llama.native.llamaloglevel
  772. </a>
  773. </li>
  774. <li class="md-nav__item">
  775. <a href="../xmldocs/llama.native.llamamodelkvoverridetype/" class="md-nav__link">
  776. llama.native.llamamodelkvoverridetype
  777. </a>
  778. </li>
  779. <li class="md-nav__item">
  780. <a href="../xmldocs/llama.native.llamamodelmetadataoverride/" class="md-nav__link">
  781. llama.native.llamamodelmetadataoverride
  782. </a>
  783. </li>
  784. <li class="md-nav__item">
  785. <a href="../xmldocs/llama.native.llamamodelparams/" class="md-nav__link">
  786. llama.native.llamamodelparams
  787. </a>
  788. </li>
  789. <li class="md-nav__item">
  790. <a href="../xmldocs/llama.native.llamamodelquantizeparams/" class="md-nav__link">
  791. llama.native.llamamodelquantizeparams
  792. </a>
  793. </li>
  794. <li class="md-nav__item">
  795. <a href="../xmldocs/llama.native.llamanativebatch/" class="md-nav__link">
  796. llama.native.llamanativebatch
  797. </a>
  798. </li>
  799. <li class="md-nav__item">
  800. <a href="../xmldocs/llama.native.llamapoolingtype/" class="md-nav__link">
  801. llama.native.llamapoolingtype
  802. </a>
  803. </li>
  804. <li class="md-nav__item">
  805. <a href="../xmldocs/llama.native.llamapos/" class="md-nav__link">
  806. llama.native.llamapos
  807. </a>
  808. </li>
  809. <li class="md-nav__item">
  810. <a href="../xmldocs/llama.native.llamaropetype/" class="md-nav__link">
  811. llama.native.llamaropetype
  812. </a>
  813. </li>
  814. <li class="md-nav__item">
  815. <a href="../xmldocs/llama.native.llamaseqid/" class="md-nav__link">
  816. llama.native.llamaseqid
  817. </a>
  818. </li>
  819. <li class="md-nav__item">
  820. <a href="../xmldocs/llama.native.llamatoken/" class="md-nav__link">
  821. llama.native.llamatoken
  822. </a>
  823. </li>
  824. <li class="md-nav__item">
  825. <a href="../xmldocs/llama.native.llamatokendata/" class="md-nav__link">
  826. llama.native.llamatokendata
  827. </a>
  828. </li>
  829. <li class="md-nav__item">
  830. <a href="../xmldocs/llama.native.llamatokendataarray/" class="md-nav__link">
  831. llama.native.llamatokendataarray
  832. </a>
  833. </li>
  834. <li class="md-nav__item">
  835. <a href="../xmldocs/llama.native.llamatokendataarraynative/" class="md-nav__link">
  836. llama.native.llamatokendataarraynative
  837. </a>
  838. </li>
  839. <li class="md-nav__item">
  840. <a href="../xmldocs/llama.native.llamatokentype/" class="md-nav__link">
  841. llama.native.llamatokentype
  842. </a>
  843. </li>
  844. <li class="md-nav__item">
  845. <a href="../xmldocs/llama.native.llamavocabtype/" class="md-nav__link">
  846. llama.native.llamavocabtype
  847. </a>
  848. </li>
  849. <li class="md-nav__item">
  850. <a href="../xmldocs/llama.native.llavaimageembed/" class="md-nav__link">
  851. llama.native.llavaimageembed
  852. </a>
  853. </li>
  854. <li class="md-nav__item">
  855. <a href="../xmldocs/llama.native.nativeapi/" class="md-nav__link">
  856. llama.native.nativeapi
  857. </a>
  858. </li>
  859. <li class="md-nav__item">
  860. <a href="../xmldocs/llama.native.nativelibraryconfig/" class="md-nav__link">
  861. llama.native.nativelibraryconfig
  862. </a>
  863. </li>
  864. <li class="md-nav__item">
  865. <a href="../xmldocs/llama.native.ropescalingtype/" class="md-nav__link">
  866. llama.native.ropescalingtype
  867. </a>
  868. </li>
  869. <li class="md-nav__item">
  870. <a href="../xmldocs/llama.native.safellamacontexthandle/" class="md-nav__link">
  871. llama.native.safellamacontexthandle
  872. </a>
  873. </li>
  874. <li class="md-nav__item">
  875. <a href="../xmldocs/llama.native.safellamagrammarhandle/" class="md-nav__link">
  876. llama.native.safellamagrammarhandle
  877. </a>
  878. </li>
  879. <li class="md-nav__item">
  880. <a href="../xmldocs/llama.native.safellamahandlebase/" class="md-nav__link">
  881. llama.native.safellamahandlebase
  882. </a>
  883. </li>
  884. <li class="md-nav__item">
  885. <a href="../xmldocs/llama.native.safellamamodelhandle/" class="md-nav__link">
  886. llama.native.safellamamodelhandle
  887. </a>
  888. </li>
  889. <li class="md-nav__item">
  890. <a href="../xmldocs/llama.native.safellavaimageembedhandle/" class="md-nav__link">
  891. llama.native.safellavaimageembedhandle
  892. </a>
  893. </li>
  894. <li class="md-nav__item">
  895. <a href="../xmldocs/llama.native.safellavamodelhandle/" class="md-nav__link">
  896. llama.native.safellavamodelhandle
  897. </a>
  898. </li>
  899. <li class="md-nav__item">
  900. <a href="../xmldocs/llama.quantizer/" class="md-nav__link">
  901. llama.quantizer
  902. </a>
  903. </li>
  904. <li class="md-nav__item">
  905. <a href="../xmldocs/llama.sampling.basesamplingpipeline/" class="md-nav__link">
  906. llama.sampling.basesamplingpipeline
  907. </a>
  908. </li>
  909. <li class="md-nav__item">
  910. <a href="../xmldocs/llama.sampling.defaultsamplingpipeline/" class="md-nav__link">
  911. llama.sampling.defaultsamplingpipeline
  912. </a>
  913. </li>
  914. <li class="md-nav__item">
  915. <a href="../xmldocs/llama.sampling.greedysamplingpipeline/" class="md-nav__link">
  916. llama.sampling.greedysamplingpipeline
  917. </a>
  918. </li>
  919. <li class="md-nav__item">
  920. <a href="../xmldocs/llama.sampling.isamplingpipeline/" class="md-nav__link">
  921. llama.sampling.isamplingpipeline
  922. </a>
  923. </li>
  924. <li class="md-nav__item">
  925. <a href="../xmldocs/llama.sampling.isamplingpipelineextensions/" class="md-nav__link">
  926. llama.sampling.isamplingpipelineextensions
  927. </a>
  928. </li>
  929. <li class="md-nav__item">
  930. <a href="../xmldocs/llama.sampling.mirostate2samplingpipeline/" class="md-nav__link">
  931. llama.sampling.mirostate2samplingpipeline
  932. </a>
  933. </li>
  934. <li class="md-nav__item">
  935. <a href="../xmldocs/llama.sampling.mirostatesamplingpipeline/" class="md-nav__link">
  936. llama.sampling.mirostatesamplingpipeline
  937. </a>
  938. </li>
  939. <li class="md-nav__item">
  940. <a href="../xmldocs/llama.sessionstate/" class="md-nav__link">
  941. llama.sessionstate
  942. </a>
  943. </li>
  944. <li class="md-nav__item">
  945. <a href="../xmldocs/llama.streamingtokendecoder/" class="md-nav__link">
  946. llama.streamingtokendecoder
  947. </a>
  948. </li>
  949. <li class="md-nav__item">
  950. <a href="../xmldocs/llama.types.chatcompletion/" class="md-nav__link">
  951. llama.types.chatcompletion
  952. </a>
  953. </li>
  954. <li class="md-nav__item">
  955. <a href="../xmldocs/llama.types.chatcompletionchoice/" class="md-nav__link">
  956. llama.types.chatcompletionchoice
  957. </a>
  958. </li>
  959. <li class="md-nav__item">
  960. <a href="../xmldocs/llama.types.chatcompletionchunk/" class="md-nav__link">
  961. llama.types.chatcompletionchunk
  962. </a>
  963. </li>
  964. <li class="md-nav__item">
  965. <a href="../xmldocs/llama.types.chatcompletionchunkchoice/" class="md-nav__link">
  966. llama.types.chatcompletionchunkchoice
  967. </a>
  968. </li>
  969. <li class="md-nav__item">
  970. <a href="../xmldocs/llama.types.chatcompletionchunkdelta/" class="md-nav__link">
  971. llama.types.chatcompletionchunkdelta
  972. </a>
  973. </li>
  974. <li class="md-nav__item">
  975. <a href="../xmldocs/llama.types.chatcompletionmessage/" class="md-nav__link">
  976. llama.types.chatcompletionmessage
  977. </a>
  978. </li>
  979. <li class="md-nav__item">
  980. <a href="../xmldocs/llama.types.chatmessagerecord/" class="md-nav__link">
  981. llama.types.chatmessagerecord
  982. </a>
  983. </li>
  984. <li class="md-nav__item">
  985. <a href="../xmldocs/llama.types.chatrole/" class="md-nav__link">
  986. llama.types.chatrole
  987. </a>
  988. </li>
  989. <li class="md-nav__item">
  990. <a href="../xmldocs/llama.types.completion/" class="md-nav__link">
  991. llama.types.completion
  992. </a>
  993. </li>
  994. <li class="md-nav__item">
  995. <a href="../xmldocs/llama.types.completionchoice/" class="md-nav__link">
  996. llama.types.completionchoice
  997. </a>
  998. </li>
  999. <li class="md-nav__item">
  1000. <a href="../xmldocs/llama.types.completionchunk/" class="md-nav__link">
  1001. llama.types.completionchunk
  1002. </a>
  1003. </li>
  1004. <li class="md-nav__item">
  1005. <a href="../xmldocs/llama.types.completionlogprobs/" class="md-nav__link">
  1006. llama.types.completionlogprobs
  1007. </a>
  1008. </li>
  1009. <li class="md-nav__item">
  1010. <a href="../xmldocs/llama.types.completionusage/" class="md-nav__link">
  1011. llama.types.completionusage
  1012. </a>
  1013. </li>
  1014. <li class="md-nav__item">
  1015. <a href="../xmldocs/llama.types.embedding/" class="md-nav__link">
  1016. llama.types.embedding
  1017. </a>
  1018. </li>
  1019. <li class="md-nav__item">
  1020. <a href="../xmldocs/llama.types.embeddingdata/" class="md-nav__link">
  1021. llama.types.embeddingdata
  1022. </a>
  1023. </li>
  1024. <li class="md-nav__item">
  1025. <a href="../xmldocs/llama.types.embeddingusage/" class="md-nav__link">
  1026. llama.types.embeddingusage
  1027. </a>
  1028. </li>
  1029. <li class="md-nav__item">
  1030. <a href="../xmldocs/logger/" class="md-nav__link">
  1031. logger
  1032. </a>
  1033. </li>
  1034. </ul>
  1035. </nav>
  1036. </li>
  1037. </ul>
  1038. </nav>
  1039. </div>
  1040. </div>
  1041. </div>
  1042. <div class="md-sidebar md-sidebar--secondary" data-md-component="sidebar" data-md-type="toc" >
  1043. <div class="md-sidebar__scrollwrap">
  1044. <div class="md-sidebar__inner">
  1045. <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
  1046. <label class="md-nav__title" for="__toc">
  1047. <span class="md-nav__icon md-icon"></span>
  1048. Table of contents
  1049. </label>
  1050. <ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
  1051. <li class="md-nav__item">
  1052. <a href="#why-gpu-is-not-used-when-i-have-installed-cuda" class="md-nav__link">
  1053. Why GPU is not used when I have installed CUDA
  1054. </a>
  1055. </li>
  1056. <li class="md-nav__item">
  1057. <a href="#why-the-inference-is-slow" class="md-nav__link">
  1058. Why the inference is slow
  1059. </a>
  1060. </li>
  1061. <li class="md-nav__item">
  1062. <a href="#why-the-program-crashes-before-any-output-is-generated" class="md-nav__link">
  1063. Why the program crashes before any output is generated
  1064. </a>
  1065. </li>
  1066. <li class="md-nav__item">
  1067. <a href="#why-my-model-is-generating-output-infinitely" class="md-nav__link">
  1068. Why my model is generating output infinitely
  1069. </a>
  1070. </li>
  1071. <li class="md-nav__item">
  1072. <a href="#how-to-run-llm-with-non-english-languages" class="md-nav__link">
  1073. How to run LLM with non-English languages
  1074. </a>
  1075. </li>
  1076. <li class="md-nav__item">
  1077. <a href="#pay-attention-to-the-length-of-prompt" class="md-nav__link">
  1078. Pay attention to the length of prompt
  1079. </a>
  1080. </li>
  1081. <li class="md-nav__item">
  1082. <a href="#choose-models-weight-depending-on-you-task" class="md-nav__link">
  1083. Choose model weights depending on your task
  1084. </a>
  1085. </li>
  1086. </ul>
  1087. </nav>
  1088. </div>
  1089. </div>
  1090. </div>
  1091. <div class="md-content" data-md-component="content">
  1092. <article class="md-content__inner md-typeset">
  1093. <h1 id="frequently-asked-qustions">Frequently asked questions</h1>
  1094. <p>Sometimes, your application with LLM and LLamaSharp may have unexpected behaviours. Here are some frequently asked questions, which may help you to deal with your problem.</p>
  1095. <h2 id="why-gpu-is-not-used-when-i-have-installed-cuda">Why GPU is not used when I have installed CUDA</h2>
  1096. <ol>
  1097. <li>If you are using backend packages, please make sure you have installed the cuda backend package which matches the cuda version of your device. Please note that before LLamaSharp v0.10.0, only one backend package should be installed.</li>
  1098. <li>Add <code>NativeLibraryConfig.Instance.WithLogs(LLamaLogLevel.Info)</code> to the very beginning of your code. The log will show which native library file is loaded. If the CPU library is loaded, please try to compile the native library yourself and open an issue for that. If the CUDA library is loaded, please check if <code>GpuLayerCount &gt; 0</code> when loading the model weight.</li>
  1099. </ol>
  1100. <h2 id="why-the-inference-is-slow">Why the inference is slow</h2>
  1101. <p>Firstly, due to the large size of LLM models, it requires more time to generate outputs than other models, especially when you are using models larger than 30B.</p>
  1102. <p>To see if that's a LLamaSharp performance issue, please follow the two tips below.</p>
  1103. <ol>
  1104. <li>If you are using CUDA, Metal or OpenCL, please set <code>GpuLayerCount</code> as large as possible.</li>
  1105. <li>If it's still slower than you expect it to be, please try to run the same model with the same settings in <a href="https://github.com/ggerganov/llama.cpp/tree/master/examples">llama.cpp examples</a>. If llama.cpp outperforms LLamaSharp significantly, it's likely a LLamaSharp bug; please report it to us.</li>
  1106. </ol>
  1107. <h2 id="why-the-program-crashes-before-any-output-is-generated">Why the program crashes before any output is generated</h2>
  1108. <p>Generally, there are two possible cases for this problem:</p>
  1109. <ol>
  1110. <li>The native library (backend) you are using is not compatible with the LLamaSharp version. If you compiled the native library yourself, please make sure you have checked out llama.cpp at the commit corresponding to your LLamaSharp version, which can be found at the bottom of the README.</li>
  1111. <li>The model file you are using is not compatible with the backend. If you are using a GGUF file downloaded from huggingface, please check its publishing time.</li>
  1112. </ol>
  1113. <h2 id="why-my-model-is-generating-output-infinitely">Why my model is generating output infinitely</h2>
  1114. <p>Please set anti-prompt or max-length when executing the inference.</p>
  1115. <p>An anti-prompt, also called a "stop keyword", decides when to stop the response generation. Under interactive mode, the maximum token count is usually not set, which makes the LLM generate responses infinitely. Therefore, setting the anti-prompt correctly helps a lot to avoid strange behaviours. For example, the prompt file <code>chat-with-bob.txt</code> has the following content:</p>
  1116. <pre><code>Transcript of a dialog, where the User interacts with an Assistant named Bob. Bob is helpful, kind, honest, good at writing, and never fails to answer the User's requests immediately and with precision.
  1117. User: Hello, Bob.
  1118. Bob: Hello. How may I help you today?
  1119. User: Please tell me the largest city in Europe.
  1120. Bob: Sure. The largest city in Europe is Moscow, the capital of Russia.
  1121. User:
  1122. </code></pre>
  1123. <p>Therefore, the anti-prompt should be set as "User:". If the last line of the prompt is removed, the LLM will automatically generate one question (as the User) and one response (as Bob) when running the chat session. Therefore, it is suggested to append the anti-prompt to the prompt when starting a chat session.</p>
  1124. <p>What if an extra line is appended? The string "User:" in the prompt will be followed by a "\n" character. Thus, when running the model, the automatic generation of a question-and-response pair may appear, because the anti-prompt is "User:" but the last token is "User:\n". Whether it appears is undefined behaviour, which depends on the implementation inside the <code>LLamaExecutor</code>. Anyway, since it may lead to unexpected behaviours, it's recommended to trim your prompt or carefully keep it consistent with your anti-prompt.</p>
  1125. <h2 id="how-to-run-llm-with-non-english-languages">How to run LLM with non-English languages</h2>
  1126. <p>English is the most popular language in the world, and in the field of LLMs. If you want to accept inputs and generate outputs in other languages, please follow the tip below.</p>
  1127. <ol>
  1128. <li>Ensure the model you selected is well-trained with data of your language. For example, <a href="https://github.com/meta-llama/llama">LLaMA</a> (original) used little Chinese text during pretraining, while <a href="https://github.com/ymcui/Chinese-LLaMA-Alpaca">Chinese-LLaMA-Alpaca</a> finetuned LLaMA with a large amount of Chinese text data. Therefore, the quality of the output of Chinese-LLaMA-Alpaca is much better than that of LLaMA.</li>
  1129. </ol>
  1130. <h2 id="pay-attention-to-the-length-of-prompt">Pay attention to the length of prompt</h2>
  1131. <p>Sometimes we want to input a long prompt to execute a task. However, the context size may limit the inference of LLama model. Please ensure the inequality below holds.</p>
  1132. <p>$$ len(prompt) + len(response) &lt; len(context) $$</p>
  1133. <p>In this inequality, <code>len(response)</code> refers to the expected tokens for LLM to generate.</p>
  1134. <h2 id="choose-models-weight-depending-on-you-task">Choose model weights depending on your task</h2>
  1135. <p>The differences between models may lead to very different behaviours under the same task. For example, if you're building a chat bot for a non-English language, a model fine-tuned specifically for the language you want to use will have a huge effect on the performance.</p>
  1136. </article>
  1137. </div>
  1138. </div>
  1139. </main>
  1140. <footer class="md-footer">
  1141. <div class="md-footer-meta md-typeset">
  1142. <div class="md-footer-meta__inner md-grid">
  1143. <div class="md-copyright">
  1144. Made with
  1145. <a href="https://squidfunk.github.io/mkdocs-material/" target="_blank" rel="noopener">
  1146. Material for MkDocs
  1147. </a>
  1148. </div>
  1149. </div>
  1150. </div>
  1151. </footer>
  1152. </div>
  1153. <div class="md-dialog" data-md-component="dialog">
  1154. <div class="md-dialog__inner md-typeset"></div>
  1155. </div>
  1156. <script id="__config" type="application/json">{"base": "..", "features": [], "search": "../assets/javascripts/workers/search.74e28a9f.min.js", "translations": {"clipboard.copied": "Copied to clipboard", "clipboard.copy": "Copy to clipboard", "search.result.more.one": "1 more on this page", "search.result.more.other": "# more on this page", "search.result.none": "No matching documents", "search.result.one": "1 matching document", "search.result.other": "# matching documents", "search.result.placeholder": "Type to start searching", "search.result.term.missing": "Missing", "select.version": "Select version"}, "version": {"provider": "mike"}}</script>
  1157. <script src="../assets/javascripts/bundle.220ee61c.min.js"></script>
  1158. </body>
  1159. </html>

C#/.NET上易用的LLM高性能推理框架,支持LLaMA和LLaVA系列模型。

Contributors (1)