You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

index.html 63 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955
  1. <!doctype html>
  2. <html lang="en" class="no-js">
  3. <head>
  4. <meta charset="utf-8">
  5. <meta name="viewport" content="width=device-width,initial-scale=1">
  6. <link rel="prev" href="../Architecture/">
  7. <link rel="next" href="../ContributingGuide/">
  8. <link rel="icon" href="../media/icon128.png">
  9. <meta name="generator" content="mkdocs-1.4.3, mkdocs-material-9.1.20">
  10. <title>FAQ - LLamaSharp Documentation</title>
  11. <link rel="stylesheet" href="../assets/stylesheets/main.eebd395e.min.css">
  12. <link rel="stylesheet" href="../assets/stylesheets/palette.ecc896b0.min.css">
  13. <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
  14. <link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Fira+Sans:300,300i,400,400i,700,700i%7CFira+Mono:400,400i,700,700i&display=fallback">
  15. <style>:root{--md-text-font:"Fira Sans";--md-code-font:"Fira Mono"}</style>
  16. <link rel="stylesheet" href="../css/extra.css?v=14">
  17. <!-- Bootstrap helpers: __md_scope is the URL of ".." resolved against the current location; __md_hash folds a string into an integer via h = (h << 5) - h + charCode; __md_get(name, storage = localStorage, scope = __md_scope) JSON-parses the storage item stored under scope.pathname + "." + name; __md_set(name, value, storage = localStorage, scope = __md_scope) JSON-stringifies value into that same key and silently ignores any exception thrown by setItem. --><script>__md_scope=new URL("..",location),__md_hash=e=>[...e].reduce((e,_)=>(e<<5)-e+_.charCodeAt(0),0),__md_get=(e,_=localStorage,t=__md_scope)=>JSON.parse(_.getItem(t.pathname+"."+e)),__md_set=(e,_,t=localStorage,a=__md_scope)=>{try{t.setItem(a.pathname+"."+e,JSON.stringify(_))}catch(e){}}</script>
  18. </head>
  19. <body dir="ltr" data-md-color-scheme="default" data-md-color-primary="white" data-md-color-accent="red">
  20. <!-- Reads the "__palette" entry through __md_get; when it exists and its color property is an object, copies every key of palette.color onto the body element as a data-md-color-(key) attribute, overriding the defaults written in the body tag. Runs inline, directly after the opening body tag. --><script>var palette=__md_get("__palette");if(palette&&"object"==typeof palette.color)for(var key of Object.keys(palette.color))document.body.setAttribute("data-md-color-"+key,palette.color[key])</script>
  21. <input class="md-toggle" data-md-toggle="drawer" type="checkbox" id="__drawer" autocomplete="off">
  22. <input class="md-toggle" data-md-toggle="search" type="checkbox" id="__search" autocomplete="off">
  23. <label class="md-overlay" for="__drawer"></label>
  24. <div data-md-component="skip">
  25. <a href="#frequently-asked-qustions" class="md-skip">
  26. Skip to content
  27. </a>
  28. </div>
  29. <div data-md-component="announce">
  30. </div>
  31. <div data-md-color-scheme="default" data-md-component="outdated" hidden>
  32. </div>
  33. <header class="md-header md-header--shadow" data-md-component="header">
  34. <nav class="md-header__inner md-grid" aria-label="Header">
  35. <a href=".." title="LLamaSharp Documentation" class="md-header__button md-logo" aria-label="LLamaSharp Documentation" data-md-component="logo">
  36. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M13 9h5.5L13 3.5V9M6 2h8l6 6v12a2 2 0 0 1-2 2H6a2 2 0 0 1-2-2V4c0-1.11.89-2 2-2m9 16v-2H6v2h9m3-4v-2H6v2h12Z"/></svg>
  37. </a>
  38. <label class="md-header__button md-icon" for="__drawer">
  39. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M3 6h18v2H3V6m0 5h18v2H3v-2m0 5h18v2H3v-2Z"/></svg>
  40. </label>
  41. <div class="md-header__title" data-md-component="header-title">
  42. <div class="md-header__ellipsis">
  43. <div class="md-header__topic">
  44. <span class="md-ellipsis">
  45. LLamaSharp Documentation
  46. </span>
  47. </div>
  48. <div class="md-header__topic" data-md-component="header-topic">
  49. <span class="md-ellipsis">
  50. FAQ
  51. </span>
  52. </div>
  53. </div>
  54. </div>
  55. <form class="md-header__option" data-md-component="palette">
  56. <input class="md-option" data-md-color-media="(prefers-color-scheme: light)" data-md-color-scheme="default" data-md-color-primary="white" data-md-color-accent="red" aria-label="Switch to dark mode" type="radio" name="__palette" id="__palette_1">
  57. <label class="md-header__button md-icon" title="Switch to dark mode" for="__palette_2" hidden>
  58. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 7a5 5 0 0 1 5 5 5 5 0 0 1-5 5 5 5 0 0 1-5-5 5 5 0 0 1 5-5m0 2a3 3 0 0 0-3 3 3 3 0 0 0 3 3 3 3 0 0 0 3-3 3 3 0 0 0-3-3m0-7 2.39 3.42C13.65 5.15 12.84 5 12 5c-.84 0-1.65.15-2.39.42L12 2M3.34 7l4.16-.35A7.2 7.2 0 0 0 5.94 8.5c-.44.74-.69 1.5-.83 2.29L3.34 7m.02 10 1.76-3.77a7.131 7.131 0 0 0 2.38 4.14L3.36 17M20.65 7l-1.77 3.79a7.023 7.023 0 0 0-2.38-4.15l4.15.36m-.01 10-4.14.36c.59-.51 1.12-1.14 1.54-1.86.42-.73.69-1.5.83-2.29L20.64 17M12 22l-2.41-3.44c.74.27 1.55.44 2.41.44.82 0 1.63-.17 2.37-.44L12 22Z"/></svg>
  59. </label>
  60. <input class="md-option" data-md-color-media="(prefers-color-scheme: dark)" data-md-color-scheme="slate" data-md-color-primary="blue" data-md-color-accent="blue" aria-label="Switch to light mode" type="radio" name="__palette" id="__palette_2">
  61. <label class="md-header__button md-icon" title="Switch to light mode" for="__palette_1" hidden>
  62. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="m17.75 4.09-2.53 1.94.91 3.06-2.63-1.81-2.63 1.81.91-3.06-2.53-1.94L12.44 4l1.06-3 1.06 3 3.19.09m3.5 6.91-1.64 1.25.59 1.98-1.7-1.17-1.7 1.17.59-1.98L15.75 11l2.06-.05L18.5 9l.69 1.95 2.06.05m-2.28 4.95c.83-.08 1.72 1.1 1.19 1.85-.32.45-.66.87-1.08 1.27C15.17 23 8.84 23 4.94 19.07c-3.91-3.9-3.91-10.24 0-14.14.4-.4.82-.76 1.27-1.08.75-.53 1.93.36 1.85 1.19-.27 2.86.69 5.83 2.89 8.02a9.96 9.96 0 0 0 8.02 2.89m-1.64 2.02a12.08 12.08 0 0 1-7.8-3.47c-2.17-2.19-3.33-5-3.49-7.82-2.81 3.14-2.7 7.96.31 10.98 3.02 3.01 7.84 3.12 10.98.31Z"/></svg>
  63. </label>
  64. </form>
  65. <label class="md-header__button md-icon" for="__search">
  66. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.516 6.516 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5Z"/></svg>
  67. </label>
  68. <div class="md-search" data-md-component="search" role="dialog">
  69. <label class="md-search__overlay" for="__search"></label>
  70. <div class="md-search__inner" role="search">
  71. <form class="md-search__form" name="search">
  72. <input type="text" class="md-search__input" name="query" aria-label="Search" placeholder="Search" autocapitalize="off" autocorrect="off" autocomplete="off" spellcheck="false" data-md-component="search-query" required>
  73. <label class="md-search__icon md-icon" for="__search">
  74. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.516 6.516 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5Z"/></svg>
  75. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11h12Z"/></svg>
  76. </label>
  77. <nav class="md-search__options" aria-label="Search">
  78. <button type="reset" class="md-search__icon md-icon" title="Clear" aria-label="Clear" tabindex="-1">
  79. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M19 6.41 17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12 19 6.41Z"/></svg>
  80. </button>
  81. </nav>
  82. </form>
  83. <div class="md-search__output">
  84. <div class="md-search__scrollwrap" data-md-scrollfix>
  85. <div class="md-search-result" data-md-component="search-result">
  86. <div class="md-search-result__meta">
  87. Initializing search
  88. </div>
  89. <ol class="md-search-result__list" role="presentation"></ol>
  90. </div>
  91. </div>
  92. </div>
  93. </div>
  94. </div>
  95. </nav>
  96. </header>
  97. <div class="md-container" data-md-component="container">
  98. <main class="md-main" data-md-component="main">
  99. <div class="md-main__inner md-grid">
  100. <div class="md-sidebar md-sidebar--primary" data-md-component="sidebar" data-md-type="navigation" >
  101. <div class="md-sidebar__scrollwrap">
  102. <div class="md-sidebar__inner">
  103. <nav class="md-nav md-nav--primary" aria-label="Navigation" data-md-level="0">
  104. <label class="md-nav__title" for="__drawer">
  105. <a href=".." title="LLamaSharp Documentation" class="md-nav__button md-logo" aria-label="LLamaSharp Documentation" data-md-component="logo">
  106. <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M13 9h5.5L13 3.5V9M6 2h8l6 6v12a2 2 0 0 1-2 2H6a2 2 0 0 1-2-2V4c0-1.11.89-2 2-2m9 16v-2H6v2h9m3-4v-2H6v2h12Z"/></svg>
  107. </a>
  108. LLamaSharp Documentation
  109. </label>
  110. <ul class="md-nav__list" data-md-scrollfix>
  111. <li class="md-nav__item">
  112. <a href=".." class="md-nav__link">
  113. Overview
  114. </a>
  115. </li>
  116. <li class="md-nav__item">
  117. <a href="../QuickStart/" class="md-nav__link">
  118. Quick Start
  119. </a>
  120. </li>
  121. <li class="md-nav__item">
  122. <a href="../Architecture/" class="md-nav__link">
  123. Architecture
  124. </a>
  125. </li>
  126. <li class="md-nav__item md-nav__item--active">
  127. <input class="md-nav__toggle md-toggle" type="checkbox" id="__toc">
  128. <label class="md-nav__link md-nav__link--active" for="__toc">
  129. FAQ
  130. <span class="md-nav__icon md-icon"></span>
  131. </label>
  132. <a href="./" class="md-nav__link md-nav__link--active">
  133. FAQ
  134. </a>
  135. <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
  136. <label class="md-nav__title" for="__toc">
  137. <span class="md-nav__icon md-icon"></span>
  138. Table of contents
  139. </label>
  140. <ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
  141. <li class="md-nav__item">
  142. <a href="#why-gpu-is-not-used-when-i-have-installed-cuda" class="md-nav__link">
  143. Why GPU is not used when I have installed CUDA
  144. </a>
  145. </li>
  146. <li class="md-nav__item">
  147. <a href="#why-the-inference-is-slow" class="md-nav__link">
  148. Why the inference is slow
  149. </a>
  150. </li>
  151. <li class="md-nav__item">
  152. <a href="#why-the-program-crashes-before-any-output-is-generated" class="md-nav__link">
  153. Why the program crashes before any output is generated
  154. </a>
  155. </li>
  156. <li class="md-nav__item">
  157. <a href="#why-my-model-is-generating-output-infinitely" class="md-nav__link">
  158. Why my model is generating output infinitely
  159. </a>
  160. </li>
  161. <li class="md-nav__item">
  162. <a href="#how-to-run-llm-with-non-english-languages" class="md-nav__link">
  163. How to run LLM with non-English languages
  164. </a>
  165. </li>
  166. <li class="md-nav__item">
  167. <a href="#pay-attention-to-the-length-of-prompt" class="md-nav__link">
  168. Pay attention to the length of prompt
  169. </a>
  170. </li>
  171. <li class="md-nav__item">
  172. <a href="#choose-models-weight-depending-on-you-task" class="md-nav__link">
  173. Choose models weight depending on your task
  174. </a>
  175. </li>
  176. </ul>
  177. </nav>
  178. </li>
  179. <li class="md-nav__item">
  180. <a href="../ContributingGuide/" class="md-nav__link">
  181. Contributing Guide
  182. </a>
  183. </li>
  184. <li class="md-nav__item md-nav__item--nested">
  185. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_6" >
  186. <label class="md-nav__link" for="__nav_6" id="__nav_6_label" tabindex="0">
  187. Tutorials
  188. <span class="md-nav__icon md-icon"></span>
  189. </label>
  190. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_6_label" aria-expanded="false">
  191. <label class="md-nav__title" for="__nav_6">
  192. <span class="md-nav__icon md-icon"></span>
  193. Tutorials
  194. </label>
  195. <ul class="md-nav__list" data-md-scrollfix>
  196. <li class="md-nav__item">
  197. <a href="../Tutorials/NativeLibraryConfig/" class="md-nav__link">
  198. Customize the native library loading
  199. </a>
  200. </li>
  201. <li class="md-nav__item">
  202. <a href="../Tutorials/Executors/" class="md-nav__link">
  203. Use executors
  204. </a>
  205. </li>
  206. <li class="md-nav__item">
  207. <a href="../Tutorials/ChatSession/" class="md-nav__link">
  208. Use ChatSession
  209. </a>
  210. </li>
  211. <li class="md-nav__item">
  212. <a href="../Tutorials/UnderstandLLamaContext/" class="md-nav__link">
  213. Understand LLamaContext
  214. </a>
  215. </li>
  216. <li class="md-nav__item">
  217. <a href="../Tutorials/GetEmbeddings/" class="md-nav__link">
  218. Get embeddings
  219. </a>
  220. </li>
  221. <li class="md-nav__item">
  222. <a href="../Tutorials/Quantization/" class="md-nav__link">
  223. Quantize the model
  224. </a>
  225. </li>
  226. </ul>
  227. </nav>
  228. </li>
  229. <li class="md-nav__item md-nav__item--nested">
  230. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_7" >
  231. <label class="md-nav__link" for="__nav_7" id="__nav_7_label" tabindex="0">
  232. Integrations
  233. <span class="md-nav__icon md-icon"></span>
  234. </label>
  235. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_7_label" aria-expanded="false">
  236. <label class="md-nav__title" for="__nav_7">
  237. <span class="md-nav__icon md-icon"></span>
  238. Integrations
  239. </label>
  240. <ul class="md-nav__list" data-md-scrollfix>
  241. <li class="md-nav__item">
  242. <a href="../Integrations/semantic-kernel/" class="md-nav__link">
  243. semantic-kernel integration
  244. </a>
  245. </li>
  246. <li class="md-nav__item">
  247. <a href="../Integrations/kernel-memory/" class="md-nav__link">
  248. kernel-memory integration
  249. </a>
  250. </li>
  251. <li class="md-nav__item">
  252. <a href="../Integrations/BotSharp.md" class="md-nav__link">
  253. BotSharp integration
  254. </a>
  255. </li>
  256. <li class="md-nav__item">
  257. <a href="../Integrations/Langchain.md" class="md-nav__link">
  258. Langchain integration
  259. </a>
  260. </li>
  261. </ul>
  262. </nav>
  263. </li>
  264. <li class="md-nav__item md-nav__item--nested">
  265. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_8" >
  266. <label class="md-nav__link" for="__nav_8" id="__nav_8_label" tabindex="0">
  267. Examples
  268. <span class="md-nav__icon md-icon"></span>
  269. </label>
  270. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_8_label" aria-expanded="false">
  271. <label class="md-nav__title" for="__nav_8">
  272. <span class="md-nav__icon md-icon"></span>
  273. Examples
  274. </label>
  275. <ul class="md-nav__list" data-md-scrollfix>
  276. <li class="md-nav__item">
  277. <a href="../Examples/BatchedExecutorFork/" class="md-nav__link">
  278. Batched executor - multi-output to one input
  279. </a>
  280. </li>
  281. <li class="md-nav__item">
  282. <a href="../Examples/BatchedExecutorGuidance/" class="md-nav__link">
  283. Batched executor - basic guidance
  284. </a>
  285. </li>
  286. <li class="md-nav__item">
  287. <a href="../Examples/BatchedExecutorRewind/" class="md-nav__link">
  288. Batched executor - rewinding to an earlier state
  289. </a>
  290. </li>
  291. <li class="md-nav__item">
  292. <a href="../Examples/ChatChineseGB2312/" class="md-nav__link">
  293. Chinese LLM - with GB2312 encoding
  294. </a>
  295. </li>
  296. <li class="md-nav__item">
  297. <a href="../Examples/ChatSessionStripRoleName/" class="md-nav__link">
  298. ChatSession - stripping role names
  299. </a>
  300. </li>
  301. <li class="md-nav__item">
  302. <a href="../Examples/ChatSessionWithHistory/" class="md-nav__link">
  303. ChatSession - with history
  304. </a>
  305. </li>
  306. <li class="md-nav__item">
  307. <a href="../Examples/ChatSessionWithRestart/" class="md-nav__link">
  308. ChatSession - restarting
  309. </a>
  310. </li>
  311. <li class="md-nav__item">
  312. <a href="../Examples/ChatSessionWithRoleName/" class="md-nav__link">
  313. ChatSession - Basic
  314. </a>
  315. </li>
  316. <li class="md-nav__item">
  317. <a href="../Examples/CodingAssistant/" class="md-nav__link">
  318. Coding assistant
  319. </a>
  320. </li>
  321. <li class="md-nav__item">
  322. <a href="../Examples/GetEmbeddings/" class="md-nav__link">
  323. Get embeddings
  324. </a>
  325. </li>
  326. <li class="md-nav__item">
  327. <a href="../Examples/GrammarJsonResponse/" class="md-nav__link">
  328. Grammar - json response
  329. </a>
  330. </li>
  331. <li class="md-nav__item">
  332. <a href="../Examples/InstructModeExecute/" class="md-nav__link">
  333. Instruct executor - basic
  334. </a>
  335. </li>
  336. <li class="md-nav__item">
  337. <a href="../Examples/InteractiveModeExecute/" class="md-nav__link">
  338. Interactive executor - basic
  339. </a>
  340. </li>
  341. <li class="md-nav__item">
  342. <a href="../Examples/KernelMemory/" class="md-nav__link">
  343. Kernel memory integration - basic
  344. </a>
  345. </li>
  346. <li class="md-nav__item">
  347. <a href="../Examples/KernelMemorySaveAndLoad/" class="md-nav__link">
  348. Kernel-memory - save & load
  349. </a>
  350. </li>
  351. <li class="md-nav__item">
  352. <a href="../Examples/LLavaInteractiveModeExecute/" class="md-nav__link">
  353. LLaVA - basic
  354. </a>
  355. </li>
  356. <li class="md-nav__item">
  357. <a href="../Examples/LoadAndSaveSession/" class="md-nav__link">
  358. ChatSession - load & save
  359. </a>
  360. </li>
  361. <li class="md-nav__item">
  362. <a href="../Examples/LoadAndSaveState/" class="md-nav__link">
  363. Executor - save/load state
  364. </a>
  365. </li>
  366. <li class="md-nav__item">
  367. <a href="../Examples/QuantizeModel/" class="md-nav__link">
  368. Quantization
  369. </a>
  370. </li>
  371. <li class="md-nav__item">
  372. <a href="../Examples/SemanticKernelChat/" class="md-nav__link">
  373. Semantic-kernel - chat
  374. </a>
  375. </li>
  376. <li class="md-nav__item">
  377. <a href="../Examples/SemanticKernelMemory/" class="md-nav__link">
  378. Semantic-kernel - with kernel-memory
  379. </a>
  380. </li>
  381. <li class="md-nav__item">
  382. <a href="../Examples/SemanticKernelPrompt/" class="md-nav__link">
  383. Semantic-kernel - basic
  384. </a>
  385. </li>
  386. <li class="md-nav__item">
  387. <a href="../Examples/StatelessModeExecute/" class="md-nav__link">
  388. Stateless executor
  389. </a>
  390. </li>
  391. <li class="md-nav__item">
  392. <a href="../Examples/TalkToYourself/" class="md-nav__link">
  393. Talk to yourself
  394. </a>
  395. </li>
  396. </ul>
  397. </nav>
  398. </li>
  399. <li class="md-nav__item md-nav__item--nested">
  400. <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_9" >
  401. <label class="md-nav__link" for="__nav_9" id="__nav_9_label" tabindex="0">
  402. API Reference
  403. <span class="md-nav__icon md-icon"></span>
  404. </label>
  405. <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_9_label" aria-expanded="false">
  406. <label class="md-nav__title" for="__nav_9">
  407. <span class="md-nav__icon md-icon"></span>
  408. API Reference
  409. </label>
  410. <ul class="md-nav__list" data-md-scrollfix>
  411. <li class="md-nav__item">
  412. <a href="../xmldocs/" class="md-nav__link">
  413. index
  414. </a>
  415. </li>
  416. <li class="md-nav__item">
  417. <a href="../xmldocs/llama.abstractions.adaptercollection/" class="md-nav__link">
  418. llama.abstractions.adaptercollection
  419. </a>
  420. </li>
  421. <li class="md-nav__item">
  422. <a href="../xmldocs/llama.abstractions.icontextparams/" class="md-nav__link">
  423. llama.abstractions.icontextparams
  424. </a>
  425. </li>
  426. <li class="md-nav__item">
  427. <a href="../xmldocs/llama.abstractions.ihistorytransform/" class="md-nav__link">
  428. llama.abstractions.ihistorytransform
  429. </a>
  430. </li>
  431. <li class="md-nav__item">
  432. <a href="../xmldocs/llama.abstractions.iinferenceparams/" class="md-nav__link">
  433. llama.abstractions.iinferenceparams
  434. </a>
  435. </li>
  436. <li class="md-nav__item">
  437. <a href="../xmldocs/llama.abstractions.illamaexecutor/" class="md-nav__link">
  438. llama.abstractions.illamaexecutor
  439. </a>
  440. </li>
  441. <li class="md-nav__item">
  442. <a href="../xmldocs/llama.abstractions.illamaparams/" class="md-nav__link">
  443. llama.abstractions.illamaparams
  444. </a>
  445. </li>
  446. <li class="md-nav__item">
  447. <a href="../xmldocs/llama.abstractions.imodelparams/" class="md-nav__link">
  448. llama.abstractions.imodelparams
  449. </a>
  450. </li>
  451. <li class="md-nav__item">
  452. <a href="../xmldocs/llama.abstractions.itextstreamtransform/" class="md-nav__link">
  453. llama.abstractions.itextstreamtransform
  454. </a>
  455. </li>
  456. <li class="md-nav__item">
  457. <a href="../xmldocs/llama.abstractions.itexttransform/" class="md-nav__link">
  458. llama.abstractions.itexttransform
  459. </a>
  460. </li>
  461. <li class="md-nav__item">
  462. <a href="../xmldocs/llama.abstractions.loraadapter/" class="md-nav__link">
  463. llama.abstractions.loraadapter
  464. </a>
  465. </li>
  466. <li class="md-nav__item">
  467. <a href="../xmldocs/llama.abstractions.metadataoverride/" class="md-nav__link">
  468. llama.abstractions.metadataoverride
  469. </a>
  470. </li>
  471. <li class="md-nav__item">
  472. <a href="../xmldocs/llama.abstractions.metadataoverrideconverter/" class="md-nav__link">
  473. llama.abstractions.metadataoverrideconverter
  474. </a>
  475. </li>
  476. <li class="md-nav__item">
  477. <a href="../xmldocs/llama.abstractions.tensorsplitscollection/" class="md-nav__link">
  478. llama.abstractions.tensorsplitscollection
  479. </a>
  480. </li>
  481. <li class="md-nav__item">
  482. <a href="../xmldocs/llama.abstractions.tensorsplitscollectionconverter/" class="md-nav__link">
  483. llama.abstractions.tensorsplitscollectionconverter
  484. </a>
  485. </li>
  486. <li class="md-nav__item">
  487. <a href="../xmldocs/llama.antipromptprocessor/" class="md-nav__link">
  488. llama.antipromptprocessor
  489. </a>
  490. </li>
  491. <li class="md-nav__item">
  492. <a href="../xmldocs/llama.batched.alreadypromptedconversationexception/" class="md-nav__link">
  493. llama.batched.alreadypromptedconversationexception
  494. </a>
  495. </li>
  496. <li class="md-nav__item">
  497. <a href="../xmldocs/llama.batched.batchedexecutor/" class="md-nav__link">
  498. llama.batched.batchedexecutor
  499. </a>
  500. </li>
  501. <li class="md-nav__item">
  502. <a href="../xmldocs/llama.batched.cannotforkwhilerequiresinferenceexception/" class="md-nav__link">
  503. llama.batched.cannotforkwhilerequiresinferenceexception
  504. </a>
  505. </li>
  506. <li class="md-nav__item">
  507. <a href="../xmldocs/llama.batched.cannotmodifywhilerequiresinferenceexception/" class="md-nav__link">
  508. llama.batched.cannotmodifywhilerequiresinferenceexception
  509. </a>
  510. </li>
  511. <li class="md-nav__item">
  512. <a href="../xmldocs/llama.batched.cannotsamplerequiresinferenceexception/" class="md-nav__link">
  513. llama.batched.cannotsamplerequiresinferenceexception
  514. </a>
  515. </li>
  516. <li class="md-nav__item">
  517. <a href="../xmldocs/llama.batched.cannotsamplerequirespromptexception/" class="md-nav__link">
  518. llama.batched.cannotsamplerequirespromptexception
  519. </a>
  520. </li>
  521. <li class="md-nav__item">
  522. <a href="../xmldocs/llama.batched.conversation/" class="md-nav__link">
  523. llama.batched.conversation
  524. </a>
  525. </li>
  526. <li class="md-nav__item">
  527. <a href="../xmldocs/llama.batched.conversationextensions/" class="md-nav__link">
  528. llama.batched.conversationextensions
  529. </a>
  530. </li>
  531. <li class="md-nav__item">
  532. <a href="../xmldocs/llama.batched.experimentalbatchedexecutorexception/" class="md-nav__link">
  533. llama.batched.experimentalbatchedexecutorexception
  534. </a>
  535. </li>
  536. <li class="md-nav__item">
  537. <a href="../xmldocs/llama.chatsession-1/" class="md-nav__link">
  538. llama.chatsession-1
  539. </a>
  540. </li>
  541. <li class="md-nav__item">
  542. <a href="../xmldocs/llama.chatsession/" class="md-nav__link">
  543. llama.chatsession
  544. </a>
  545. </li>
  546. <li class="md-nav__item">
  547. <a href="../xmldocs/llama.common.authorrole/" class="md-nav__link">
  548. llama.common.authorrole
  549. </a>
  550. </li>
  551. <li class="md-nav__item">
  552. <a href="../xmldocs/llama.common.chathistory/" class="md-nav__link">
  553. llama.common.chathistory
  554. </a>
  555. </li>
  556. <li class="md-nav__item">
  557. <a href="../xmldocs/llama.common.fixedsizequeue-1/" class="md-nav__link">
  558. llama.common.fixedsizequeue-1
  559. </a>
  560. </li>
  561. <li class="md-nav__item">
  562. <a href="../xmldocs/llama.common.inferenceparams/" class="md-nav__link">
  563. llama.common.inferenceparams
  564. </a>
  565. </li>
  566. <li class="md-nav__item">
  567. <a href="../xmldocs/llama.common.mirostattype/" class="md-nav__link">
  568. llama.common.mirostattype
  569. </a>
  570. </li>
  571. <li class="md-nav__item">
  572. <a href="../xmldocs/llama.common.modelparams/" class="md-nav__link">
  573. llama.common.modelparams
  574. </a>
  575. </li>
  576. <li class="md-nav__item">
  577. <a href="../xmldocs/llama.exceptions.grammarexpectedname/" class="md-nav__link">
  578. llama.exceptions.grammarexpectedname
  579. </a>
  580. </li>
  581. <li class="md-nav__item">
  582. <a href="../xmldocs/llama.exceptions.grammarexpectednext/" class="md-nav__link">
  583. llama.exceptions.grammarexpectednext
  584. </a>
  585. </li>
  586. <li class="md-nav__item">
  587. <a href="../xmldocs/llama.exceptions.grammarexpectedprevious/" class="md-nav__link">
  588. llama.exceptions.grammarexpectedprevious
  589. </a>
  590. </li>
  591. <li class="md-nav__item">
  592. <a href="../xmldocs/llama.exceptions.grammarformatexception/" class="md-nav__link">
  593. llama.exceptions.grammarformatexception
  594. </a>
  595. </li>
  596. <li class="md-nav__item">
  597. <a href="../xmldocs/llama.exceptions.grammarunexpectedcharaltelement/" class="md-nav__link">
  598. llama.exceptions.grammarunexpectedcharaltelement
  599. </a>
  600. </li>
  601. <li class="md-nav__item">
  602. <a href="../xmldocs/llama.exceptions.grammarunexpectedcharrngelement/" class="md-nav__link">
  603. llama.exceptions.grammarunexpectedcharrngelement
  604. </a>
  605. </li>
  606. <li class="md-nav__item">
  607. <a href="../xmldocs/llama.exceptions.grammarunexpectedendelement/" class="md-nav__link">
  608. llama.exceptions.grammarunexpectedendelement
  609. </a>
  610. </li>
  611. <li class="md-nav__item">
  612. <a href="../xmldocs/llama.exceptions.grammarunexpectedendofinput/" class="md-nav__link">
  613. llama.exceptions.grammarunexpectedendofinput
  614. </a>
  615. </li>
  616. <li class="md-nav__item">
  617. <a href="../xmldocs/llama.exceptions.grammarunexpectedhexcharscount/" class="md-nav__link">
  618. llama.exceptions.grammarunexpectedhexcharscount
  619. </a>
  620. </li>
  621. <li class="md-nav__item">
  622. <a href="../xmldocs/llama.exceptions.grammarunknownescapecharacter/" class="md-nav__link">
  623. llama.exceptions.grammarunknownescapecharacter
  624. </a>
  625. </li>
  626. <li class="md-nav__item">
  627. <a href="../xmldocs/llama.exceptions.llamadecodeerror/" class="md-nav__link">
  628. llama.exceptions.llamadecodeerror
  629. </a>
  630. </li>
  631. <li class="md-nav__item">
  632. <a href="../xmldocs/llama.exceptions.loadweightsfailedexception/" class="md-nav__link">
  633. llama.exceptions.loadweightsfailedexception
  634. </a>
  635. </li>
  636. <li class="md-nav__item">
  637. <a href="../xmldocs/llama.exceptions.runtimeerror/" class="md-nav__link">
  638. llama.exceptions.runtimeerror
  639. </a>
  640. </li>
  641. <li class="md-nav__item">
  642. <a href="../xmldocs/llama.extensions.icontextparamsextensions/" class="md-nav__link">
  643. llama.extensions.icontextparamsextensions
  644. </a>
  645. </li>
  646. <li class="md-nav__item">
  647. <a href="../xmldocs/llama.extensions.imodelparamsextensions/" class="md-nav__link">
  648. llama.extensions.imodelparamsextensions
  649. </a>
  650. </li>
  651. <li class="md-nav__item">
  652. <a href="../xmldocs/llama.grammars.grammar/" class="md-nav__link">
  653. llama.grammars.grammar
  654. </a>
  655. </li>
  656. <li class="md-nav__item">
  657. <a href="../xmldocs/llama.grammars.grammarrule/" class="md-nav__link">
  658. llama.grammars.grammarrule
  659. </a>
  660. </li>
  661. <li class="md-nav__item">
  662. <a href="../xmldocs/llama.ichatmodel/" class="md-nav__link">
  663. llama.ichatmodel
  664. </a>
  665. </li>
  666. <li class="md-nav__item">
  667. <a href="../xmldocs/llama.llamacache/" class="md-nav__link">
  668. llama.llamacache
  669. </a>
  670. </li>
  671. <li class="md-nav__item">
  672. <a href="../xmldocs/llama.llamaembedder/" class="md-nav__link">
  673. llama.llamaembedder
  674. </a>
  675. </li>
  676. <li class="md-nav__item">
  677. <a href="../xmldocs/llama.llamamodel/" class="md-nav__link">
  678. llama.llamamodel
  679. </a>
  680. </li>
  681. <li class="md-nav__item">
  682. <a href="../xmldocs/llama.llamamodelv1/" class="md-nav__link">
  683. llama.llamamodelv1
  684. </a>
  685. </li>
  686. <li class="md-nav__item">
  687. <a href="../xmldocs/llama.llamaparams/" class="md-nav__link">
  688. llama.llamaparams
  689. </a>
  690. </li>
  691. <li class="md-nav__item">
  692. <a href="../xmldocs/llama.llamaquantizer/" class="md-nav__link">
  693. llama.llamaquantizer
  694. </a>
  695. </li>
  696. <li class="md-nav__item">
  697. <a href="../xmldocs/llama.llamastate/" class="md-nav__link">
  698. llama.llamastate
  699. </a>
  700. </li>
  701. <li class="md-nav__item">
  702. <a href="../xmldocs/llama.llamatransforms/" class="md-nav__link">
  703. llama.llamatransforms
  704. </a>
  705. </li>
  706. <li class="md-nav__item">
  707. <a href="../xmldocs/llama.llavaweights/" class="md-nav__link">
  708. llama.llavaweights
  709. </a>
  710. </li>
  711. <li class="md-nav__item">
  712. <a href="../xmldocs/llama.native.decoderesult/" class="md-nav__link">
  713. llama.native.decoderesult
  714. </a>
  715. </li>
  716. <li class="md-nav__item">
  717. <a href="../xmldocs/llama.native.ggmltype/" class="md-nav__link">
  718. llama.native.ggmltype
  719. </a>
  720. </li>
  721. <li class="md-nav__item">
  722. <a href="../xmldocs/llama.native.gpusplitmode/" class="md-nav__link">
  723. llama.native.gpusplitmode
  724. </a>
  725. </li>
  726. <li class="md-nav__item">
  727. <a href="../xmldocs/llama.native.llamabatch/" class="md-nav__link">
  728. llama.native.llamabatch
  729. </a>
  730. </li>
  731. <li class="md-nav__item">
  732. <a href="../xmldocs/llama.native.llamabeamsstate/" class="md-nav__link">
  733. llama.native.llamabeamsstate
  734. </a>
  735. </li>
  736. <li class="md-nav__item">
  737. <a href="../xmldocs/llama.native.llamabeamview/" class="md-nav__link">
  738. llama.native.llamabeamview
  739. </a>
  740. </li>
  741. <li class="md-nav__item">
  742. <a href="../xmldocs/llama.native.llamachatmessage/" class="md-nav__link">
  743. llama.native.llamachatmessage
  744. </a>
  745. </li>
  746. <li class="md-nav__item">
  747. <a href="../xmldocs/llama.native.llamacontextparams/" class="md-nav__link">
  748. llama.native.llamacontextparams
  749. </a>
  750. </li>
  751. <li class="md-nav__item">
  752. <a href="../xmldocs/llama.native.llamaftype/" class="md-nav__link">
  753. llama.native.llamaftype
  754. </a>
  755. </li>
  756. <li class="md-nav__item">
  757. <a href="../xmldocs/llama.native.llamagrammarelement/" class="md-nav__link">
  758. llama.native.llamagrammarelement
  759. </a>
  760. </li>
  761. <li class="md-nav__item">
  762. <a href="../xmldocs/llama.native.llamagrammarelementtype/" class="md-nav__link">
  763. llama.native.llamagrammarelementtype
  764. </a>
  765. </li>
  766. <li class="md-nav__item">
  767. <a href="../xmldocs/llama.native.llamakvcacheview/" class="md-nav__link">
  768. llama.native.llamakvcacheview
  769. </a>
  770. </li>
  771. <li class="md-nav__item">
  772. <a href="../xmldocs/llama.native.llamakvcacheviewcell/" class="md-nav__link">
  773. llama.native.llamakvcacheviewcell
  774. </a>
  775. </li>
  776. <li class="md-nav__item">
  777. <a href="../xmldocs/llama.native.llamakvcacheviewsafehandle/" class="md-nav__link">
  778. llama.native.llamakvcacheviewsafehandle
  779. </a>
  780. </li>
  781. <li class="md-nav__item">
  782. <a href="../xmldocs/llama.native.llamaloglevel/" class="md-nav__link">
  783. llama.native.llamaloglevel
  784. </a>
  785. </li>
  786. <li class="md-nav__item">
  787. <a href="../xmldocs/llama.native.llamamodelkvoverridetype/" class="md-nav__link">
  788. llama.native.llamamodelkvoverridetype
  789. </a>
  790. </li>
  791. <li class="md-nav__item">
  792. <a href="../xmldocs/llama.native.llamamodelmetadataoverride/" class="md-nav__link">
  793. llama.native.llamamodelmetadataoverride
  794. </a>
  795. </li>
  796. <li class="md-nav__item">
  797. <a href="../xmldocs/llama.native.llamamodelparams/" class="md-nav__link">
  798. llama.native.llamamodelparams
  799. </a>
  800. </li>
  801. <li class="md-nav__item">
  802. <a href="../xmldocs/llama.native.llamamodelquantizeparams/" class="md-nav__link">
  803. llama.native.llamamodelquantizeparams
  804. </a>
  805. </li>
  806. <li class="md-nav__item">
  807. <a href="../xmldocs/llama.native.llamanativebatch/" class="md-nav__link">
  808. llama.native.llamanativebatch
  809. </a>
  810. </li>
  811. <li class="md-nav__item">
  812. <a href="../xmldocs/llama.native.llamapoolingtype/" class="md-nav__link">
  813. llama.native.llamapoolingtype
  814. </a>
  815. </li>
  816. <li class="md-nav__item">
  817. <a href="../xmldocs/llama.native.llamapos/" class="md-nav__link">
  818. llama.native.llamapos
  819. </a>
  820. </li>
  821. <li class="md-nav__item">
  822. <a href="../xmldocs/llama.native.llamaropetype/" class="md-nav__link">
  823. llama.native.llamaropetype
  824. </a>
  825. </li>
  826. <li class="md-nav__item">
  827. <a href="../xmldocs/llama.native.llamaseqid/" class="md-nav__link">
  828. llama.native.llamaseqid
  829. </a>
  830. </li>
  831. <li class="md-nav__item">
  832. <a href="../xmldocs/llama.native.llamatoken/" class="md-nav__link">
  833. llama.native.llamatoken
  834. </a>
  835. </li>
  836. <li class="md-nav__item">
  837. <a href="../xmldocs/llama.native.llamatokendata/" class="md-nav__link">
  838. llama.native.llamatokendata
  839. </a>
  840. </li>
  841. <li class="md-nav__item">
  842. <a href="../xmldocs/llama.native.llamatokendataarray/" class="md-nav__link">
  843. llama.native.llamatokendataarray
  844. </a>
  845. </li>
  846. <li class="md-nav__item">
  847. <a href="../xmldocs/llama.native.llamatokendataarraynative/" class="md-nav__link">
  848. llama.native.llamatokendataarraynative
  849. </a>
  850. </li>
  851. <li class="md-nav__item">
  852. <a href="../xmldocs/llama.native.llamatokentype/" class="md-nav__link">
  853. llama.native.llamatokentype
  854. </a>
  855. </li>
  856. <li class="md-nav__item">
  857. <a href="../xmldocs/llama.native.llamavocabtype/" class="md-nav__link">
  858. llama.native.llamavocabtype
  859. </a>
  860. </li>
  861. <li class="md-nav__item">
  862. <a href="../xmldocs/llama.native.llavaimageembed/" class="md-nav__link">
  863. llama.native.llavaimageembed
  864. </a>
  865. </li>
  866. <li class="md-nav__item">
  867. <a href="../xmldocs/llama.native.nativeapi/" class="md-nav__link">
  868. llama.native.nativeapi
  869. </a>
  870. </li>
  871. <li class="md-nav__item">
  872. <a href="../xmldocs/llama.native.nativelibraryconfig/" class="md-nav__link">
  873. llama.native.nativelibraryconfig
  874. </a>
  875. </li>
  876. <li class="md-nav__item">
  877. <a href="../xmldocs/llama.native.ropescalingtype/" class="md-nav__link">
  878. llama.native.ropescalingtype
  879. </a>
  880. </li>
  881. <li class="md-nav__item">
  882. <a href="../xmldocs/llama.native.safellamacontexthandle/" class="md-nav__link">
  883. llama.native.safellamacontexthandle
  884. </a>
  885. </li>
  886. <li class="md-nav__item">
  887. <a href="../xmldocs/llama.native.safellamagrammarhandle/" class="md-nav__link">
  888. llama.native.safellamagrammarhandle
  889. </a>
  890. </li>
  891. <li class="md-nav__item">
  892. <a href="../xmldocs/llama.native.safellamahandlebase/" class="md-nav__link">
  893. llama.native.safellamahandlebase
  894. </a>
  895. </li>
  896. <li class="md-nav__item">
  897. <a href="../xmldocs/llama.native.safellamamodelhandle/" class="md-nav__link">
  898. llama.native.safellamamodelhandle
  899. </a>
  900. </li>
  901. <li class="md-nav__item">
  902. <a href="../xmldocs/llama.native.safellavaimageembedhandle/" class="md-nav__link">
  903. llama.native.safellavaimageembedhandle
  904. </a>
  905. </li>
  906. <li class="md-nav__item">
  907. <a href="../xmldocs/llama.native.safellavamodelhandle/" class="md-nav__link">
  908. llama.native.safellavamodelhandle
  909. </a>
  910. </li>
  911. <li class="md-nav__item">
  912. <a href="../xmldocs/llama.quantizer/" class="md-nav__link">
  913. llama.quantizer
  914. </a>
  915. </li>
  916. <li class="md-nav__item">
  917. <a href="../xmldocs/llama.sampling.basesamplingpipeline/" class="md-nav__link">
  918. llama.sampling.basesamplingpipeline
  919. </a>
  920. </li>
  921. <li class="md-nav__item">
  922. <a href="../xmldocs/llama.sampling.defaultsamplingpipeline/" class="md-nav__link">
  923. llama.sampling.defaultsamplingpipeline
  924. </a>
  925. </li>
  926. <li class="md-nav__item">
  927. <a href="../xmldocs/llama.sampling.greedysamplingpipeline/" class="md-nav__link">
  928. llama.sampling.greedysamplingpipeline
  929. </a>
  930. </li>
  931. <li class="md-nav__item">
  932. <a href="../xmldocs/llama.sampling.isamplingpipeline/" class="md-nav__link">
  933. llama.sampling.isamplingpipeline
  934. </a>
  935. </li>
  936. <li class="md-nav__item">
  937. <a href="../xmldocs/llama.sampling.isamplingpipelineextensions/" class="md-nav__link">
  938. llama.sampling.isamplingpipelineextensions
  939. </a>
  940. </li>
  941. <li class="md-nav__item">
  942. <a href="../xmldocs/llama.sampling.mirostate2samplingpipeline/" class="md-nav__link">
  943. llama.sampling.mirostate2samplingpipeline
  944. </a>
  945. </li>
  946. <li class="md-nav__item">
  947. <a href="../xmldocs/llama.sampling.mirostatesamplingpipeline/" class="md-nav__link">
  948. llama.sampling.mirostatesamplingpipeline
  949. </a>
  950. </li>
  951. <li class="md-nav__item">
  952. <a href="../xmldocs/llama.sessionstate/" class="md-nav__link">
  953. llama.sessionstate
  954. </a>
  955. </li>
  956. <li class="md-nav__item">
  957. <a href="../xmldocs/llama.streamingtokendecoder/" class="md-nav__link">
  958. llama.streamingtokendecoder
  959. </a>
  960. </li>
  961. <li class="md-nav__item">
  962. <a href="../xmldocs/llama.types.chatcompletion/" class="md-nav__link">
  963. llama.types.chatcompletion
  964. </a>
  965. </li>
  966. <li class="md-nav__item">
  967. <a href="../xmldocs/llama.types.chatcompletionchoice/" class="md-nav__link">
  968. llama.types.chatcompletionchoice
  969. </a>
  970. </li>
  971. <li class="md-nav__item">
  972. <a href="../xmldocs/llama.types.chatcompletionchunk/" class="md-nav__link">
  973. llama.types.chatcompletionchunk
  974. </a>
  975. </li>
  976. <li class="md-nav__item">
  977. <a href="../xmldocs/llama.types.chatcompletionchunkchoice/" class="md-nav__link">
  978. llama.types.chatcompletionchunkchoice
  979. </a>
  980. </li>
  981. <li class="md-nav__item">
  982. <a href="../xmldocs/llama.types.chatcompletionchunkdelta/" class="md-nav__link">
  983. llama.types.chatcompletionchunkdelta
  984. </a>
  985. </li>
  986. <li class="md-nav__item">
  987. <a href="../xmldocs/llama.types.chatcompletionmessage/" class="md-nav__link">
  988. llama.types.chatcompletionmessage
  989. </a>
  990. </li>
  991. <li class="md-nav__item">
  992. <a href="../xmldocs/llama.types.chatmessagerecord/" class="md-nav__link">
  993. llama.types.chatmessagerecord
  994. </a>
  995. </li>
  996. <li class="md-nav__item">
  997. <a href="../xmldocs/llama.types.chatrole/" class="md-nav__link">
  998. llama.types.chatrole
  999. </a>
  1000. </li>
  1001. <li class="md-nav__item">
  1002. <a href="../xmldocs/llama.types.completion/" class="md-nav__link">
  1003. llama.types.completion
  1004. </a>
  1005. </li>
  1006. <li class="md-nav__item">
  1007. <a href="../xmldocs/llama.types.completionchoice/" class="md-nav__link">
  1008. llama.types.completionchoice
  1009. </a>
  1010. </li>
  1011. <li class="md-nav__item">
  1012. <a href="../xmldocs/llama.types.completionchunk/" class="md-nav__link">
  1013. llama.types.completionchunk
  1014. </a>
  1015. </li>
  1016. <li class="md-nav__item">
  1017. <a href="../xmldocs/llama.types.completionlogprobs/" class="md-nav__link">
  1018. llama.types.completionlogprobs
  1019. </a>
  1020. </li>
  1021. <li class="md-nav__item">
  1022. <a href="../xmldocs/llama.types.completionusage/" class="md-nav__link">
  1023. llama.types.completionusage
  1024. </a>
  1025. </li>
  1026. <li class="md-nav__item">
  1027. <a href="../xmldocs/llama.types.embedding/" class="md-nav__link">
  1028. llama.types.embedding
  1029. </a>
  1030. </li>
  1031. <li class="md-nav__item">
  1032. <a href="../xmldocs/llama.types.embeddingdata/" class="md-nav__link">
  1033. llama.types.embeddingdata
  1034. </a>
  1035. </li>
  1036. <li class="md-nav__item">
  1037. <a href="../xmldocs/llama.types.embeddingusage/" class="md-nav__link">
  1038. llama.types.embeddingusage
  1039. </a>
  1040. </li>
  1041. <li class="md-nav__item">
  1042. <a href="../xmldocs/logger/" class="md-nav__link">
  1043. logger
  1044. </a>
  1045. </li>
  1046. </ul>
  1047. </nav>
  1048. </li>
  1049. </ul>
  1050. </nav>
  1051. </div>
  1052. </div>
  1053. </div>
  1054. <div class="md-sidebar md-sidebar--secondary" data-md-component="sidebar" data-md-type="toc" >
  1055. <div class="md-sidebar__scrollwrap">
  1056. <div class="md-sidebar__inner">
  1057. <nav class="md-nav md-nav--secondary" aria-label="Table of contents">
  1058. <label class="md-nav__title" for="__toc">
  1059. <span class="md-nav__icon md-icon"></span>
  1060. Table of contents
  1061. </label>
  1062. <ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
  1063. <li class="md-nav__item">
  1064. <a href="#why-gpu-is-not-used-when-i-have-installed-cuda" class="md-nav__link">
  1065. Why GPU is not used when I have installed CUDA
  1066. </a>
  1067. </li>
  1068. <li class="md-nav__item">
  1069. <a href="#why-the-inference-is-slow" class="md-nav__link">
  1070. Why the inference is slow
  1071. </a>
  1072. </li>
  1073. <li class="md-nav__item">
  1074. <a href="#why-the-program-crashes-before-any-output-is-generated" class="md-nav__link">
  1075. Why the program crashes before any output is generated
  1076. </a>
  1077. </li>
  1078. <li class="md-nav__item">
  1079. <a href="#why-my-model-is-generating-output-infinitely" class="md-nav__link">
  1080. Why my model is generating output infinitely
  1081. </a>
  1082. </li>
  1083. <li class="md-nav__item">
  1084. <a href="#how-to-run-llm-with-non-english-languages" class="md-nav__link">
  1085. How to run LLM with non-English languages
  1086. </a>
  1087. </li>
  1088. <li class="md-nav__item">
  1089. <a href="#pay-attention-to-the-length-of-prompt" class="md-nav__link">
  1090. Pay attention to the length of prompt
  1091. </a>
  1092. </li>
  1093. <li class="md-nav__item">
  1094. <a href="#choose-models-weight-depending-on-you-task" class="md-nav__link">
  1095. Choose model weights depending on your task
  1096. </a>
  1097. </li>
  1098. </ul>
  1099. </nav>
  1100. </div>
  1101. </div>
  1102. </div>
  1103. <div class="md-content" data-md-component="content">
  1104. <article class="md-content__inner md-typeset">
  1105. <h1 id="frequently-asked-qustions">Frequently asked questions<a class="headerlink" href="#frequently-asked-qustions" title="Permanent link"></a></h1>
  1106. <p>Sometimes, your application with LLM and LLamaSharp may have unexpected behaviours. Here are some frequently asked questions, which may help you to deal with your problem.</p>
  1107. <h2 id="why-gpu-is-not-used-when-i-have-installed-cuda">Why GPU is not used when I have installed CUDA<a class="headerlink" href="#why-gpu-is-not-used-when-i-have-installed-cuda" title="Permanent link"></a></h2>
  1108. <ol>
  1109. <li>If you are using backend packages, please make sure you have installed the cuda backend package which matches the cuda version of your device. Please note that before LLamaSharp v0.10.0, only one backend package should be installed.</li>
  1110. <li>Add <code>NativeLibraryConfig.Instance.WithLogs(LLamaLogLevel.Info)</code> to the very beginning of your code. The log will show which native library file is loaded. If the CPU library is loaded, please try to compile the native library yourself and open an issue for that. If the CUDA library is loaded, please check if <code>GpuLayerCount &gt; 0</code> when loading the model weight.</li>
  1111. </ol>
  1112. <h2 id="why-the-inference-is-slow">Why the inference is slow<a class="headerlink" href="#why-the-inference-is-slow" title="Permanent link"></a></h2>
  1113. <p>Firstly, due to the large size of LLM models, it requires more time to generate outputs than other models, especially when you are using models larger than 30B.</p>
  1114. <p>To see if that's a LLamaSharp performance issue, please follow the two tips below.</p>
  1115. <ol>
  1116. <li>If you are using CUDA, Metal or OpenCL, please set <code>GpuLayerCount</code> as large as possible.</li>
  1117. <li>If it's still slower than you expect it to be, please try to run the same model with the same settings in <a href="https://github.com/ggerganov/llama.cpp/tree/master/examples">llama.cpp examples</a>. If llama.cpp outperforms LLamaSharp significantly, it's likely a LLamaSharp bug, so please report it to us.</li>
  1118. </ol>
  1119. <h2 id="why-the-program-crashes-before-any-output-is-generated">Why the program crashes before any output is generated<a class="headerlink" href="#why-the-program-crashes-before-any-output-is-generated" title="Permanent link"></a></h2>
  1120. <p>Generally, there are two possible cases for this problem:</p>
  1121. <ol>
  1122. <li>The native library (backend) you are using is not compatible with the LLamaSharp version. If you compiled the native library yourself, please make sure you have checked out llama.cpp at the commit corresponding to your LLamaSharp version, which can be found at the bottom of the README.</li>
  1123. <li>The model file you are using is not compatible with the backend. If you are using a GGUF file downloaded from huggingface, please check its publishing time.</li>
  1124. </ol>
  1125. <h2 id="why-my-model-is-generating-output-infinitely">Why my model is generating output infinitely<a class="headerlink" href="#why-my-model-is-generating-output-infinitely" title="Permanent link"></a></h2>
  1126. <p>Please set anti-prompt or max-length when executing the inference.</p>
  1127. <p>An anti-prompt can also be called a "stop keyword"; it decides when to stop the response generation. Under interactive mode, the maximum token count is never set, which makes the LLM generate responses indefinitely. Therefore, setting the anti-prompt correctly helps a lot to avoid strange behaviours. For example, the prompt file <code>chat-with-bob.txt</code> has the following content:</p>
  1128. <div class="highlight"><table class="highlighttable"><tr><td class="linenos"><div class="linenodiv"><pre><span></span><span class="normal">1</span>
  1129. <span class="normal">2</span>
  1130. <span class="normal">3</span>
  1131. <span class="normal">4</span>
  1132. <span class="normal">5</span>
  1133. <span class="normal">6</span>
  1134. <span class="normal">7</span></pre></div></td><td class="code"><div><pre><span></span><code>Transcript of a dialog, where the User interacts with an Assistant named Bob. Bob is helpful, kind, honest, good at writing, and never fails to answer the User&#39;s requests immediately and with precision.
  1135. User: Hello, Bob.
  1136. Bob: Hello. How may I help you today?
  1137. User: Please tell me the largest city in Europe.
  1138. Bob: Sure. The largest city in Europe is Moscow, the capital of Russia.
  1139. User:
  1140. </code></pre></div></td></tr></table></div>
  1141. <p>Therefore, the anti-prompt should be set to "User:". If the last line of the prompt is removed, the LLM will automatically generate one question (User) and one response (Bob) when running the chat session. Therefore, it is recommended to append the anti-prompt to the prompt when starting a chat session.</p>
  1142. <p>What if an extra line is appended? The string "User:" in the prompt will be followed by the character "\n". Thus, when running the model, the automatic generation of a question-and-response pair may appear because the anti-prompt is "User:" but the last token is "User:\n". Whether it appears is undefined behaviour, which depends on the implementation inside the <code>LLamaExecutor</code>. Anyway, since it may lead to unexpected behaviours, it's recommended to trim your prompt or carefully keep it consistent with your anti-prompt.</p>
  1143. <h2 id="how-to-run-llm-with-non-english-languages">How to run LLM with non-English languages<a class="headerlink" href="#how-to-run-llm-with-non-english-languages" title="Permanent link"></a></h2>
  1144. <p>English is the most popular language in the world, and in the field of LLMs. If you want to accept inputs and generate outputs in other languages, please follow the tip below.</p>
  1145. <ol>
  1146. <li>Ensure the model you selected is well-trained with data in your language. For example, <a href="https://github.com/meta-llama/llama">LLaMA</a> (original) used little Chinese text during pretraining, while <a href="https://github.com/ymcui/Chinese-LLaMA-Alpaca">Chinese-LLaMA-Alpaca</a> fine-tuned LLaMA with a large amount of Chinese text data. Therefore, the quality of the output of Chinese-LLaMA-Alpaca is much better than that of LLaMA.</li>
  1147. </ol>
  1148. <h2 id="pay-attention-to-the-length-of-prompt">Pay attention to the length of prompt<a class="headerlink" href="#pay-attention-to-the-length-of-prompt" title="Permanent link"></a></h2>
  1149. <p>Sometimes we want to input a long prompt to execute a task. However, the context size may limit the inference of LLama model. Please ensure the inequality below holds.</p>
  1150. <div class="arithmatex">\[ len(prompt) + len(response) &lt; len(context) \]</div>
  1151. <p>In this inequality, <code>len(response)</code> refers to the expected tokens for LLM to generate.</p>
  1152. <h2 id="choose-models-weight-depending-on-you-task">Choose model weights depending on your task<a class="headerlink" href="#choose-models-weight-depending-on-you-task" title="Permanent link"></a></h2>
  1153. <p>The differences between models may lead to very different behaviours under the same task. For example, if you're building a chat bot in a non-English language, a model fine-tuned specifically for the language you want to use will have a huge effect on the performance.</p>
  1154. </article>
  1155. </div>
  1156. </div>
  1157. </main>
  1158. <footer class="md-footer">
  1159. <div class="md-footer-meta md-typeset">
  1160. <div class="md-footer-meta__inner md-grid">
  1161. <div class="md-copyright">
  1162. Made with
  1163. <a href="https://squidfunk.github.io/mkdocs-material/" target="_blank" rel="noopener">
  1164. Material for MkDocs
  1165. </a>
  1166. </div>
  1167. </div>
  1168. </div>
  1169. </footer>
  1170. </div>
  1171. <div class="md-dialog" data-md-component="dialog">
  1172. <div class="md-dialog__inner md-typeset"></div>
  1173. </div>
  1174. <script id="__config" type="application/json">{"base": "..", "features": ["content.action.edit", "navigation.instant"], "search": "../assets/javascripts/workers/search.74e28a9f.min.js", "translations": {"clipboard.copied": "Copied to clipboard", "clipboard.copy": "Copy to clipboard", "search.result.more.one": "1 more on this page", "search.result.more.other": "# more on this page", "search.result.none": "No matching documents", "search.result.one": "1 matching document", "search.result.other": "# matching documents", "search.result.placeholder": "Type to start searching", "search.result.term.missing": "Missing", "select.version": "Select version"}, "version": {"provider": "mike"}}</script>
  1175. <script src="../assets/javascripts/bundle.220ee61c.min.js"></script>
  1176. </body>
  1177. </html>

C#/.NET上易用的LLM高性能推理框架,支持LLaMA和LLaVA系列模型。

Contributors (1)