// SciSharp/LLamaSharp

using System.Text;
using LLama.Abstractions;
using LLama.Native;

namespace LLama.Web.Common;

/// <summary>
/// Settings for a single model: a friendly name, an instance limit, and the
/// full set of <see cref="ILLamaParams"/> values.
/// </summary>
/// <remarks>
/// Every value is exposed as a read/write property (the metadata override list is
/// get-only but mutable) so that instances can be populated through object
/// initializers or property-based binding.
/// </remarks>
public class ModelOptions
    : ILLamaParams
{
    /// <summary>
    /// Model friendly name
    /// </summary>
    public string Name { get; set; }

    /// <summary>
    /// Max context instances allowed per model
    /// </summary>
    public int MaxInstances { get; set; }

    /// <inheritdoc />
    public uint? ContextSize { get; set; }

    /// <inheritdoc />
    public int MainGpu { get; set; } = 0;

    /// <inheritdoc />
    public GPUSplitMode SplitMode { get; set; } = GPUSplitMode.None;

    /// <inheritdoc />
    public int GpuLayerCount { get; set; } = 20;

    // Previously get-only with no initializer, which pinned the value to 0 and
    // made it impossible to configure. The default is unchanged; only the
    // setter is new.
    /// <inheritdoc />
    public uint SeqMax { get; set; }

    /// <inheritdoc />
    public uint Seed { get; set; } = 1686349486;

    // Previously get-only with no initializer, which pinned the value to false
    // and made it impossible to configure. The default is unchanged; only the
    // setter is new.
    /// <inheritdoc />
    public bool Embeddings { get; set; }

    /// <inheritdoc />
    public bool UseMemorymap { get; set; } = true;

    /// <inheritdoc />
    public bool UseMemoryLock { get; set; } = false;

    /// <inheritdoc />
    public string ModelPath { get; set; }

    /// <inheritdoc />
    public AdapterCollection LoraAdapters { get; set; } = new();

    /// <inheritdoc />
    public string LoraBase { get; set; } = string.Empty;

    /// <inheritdoc />
    public uint? Threads { get; set; }

    /// <inheritdoc />
    public uint? BatchThreads { get; set; }

    /// <inheritdoc />
    public uint BatchSize { get; set; } = 512;

    /// <inheritdoc />
    public uint UBatchSize { get; set; } = 512;

    /// <inheritdoc />
    public TensorSplitsCollection TensorSplits { get; set; } = new();

    /// <inheritdoc />
    public List<MetadataOverride> MetadataOverrides { get; } = new();

    /// <inheritdoc />
    public float? RopeFrequencyBase { get; set; }

    /// <inheritdoc />
    public float? RopeFrequencyScale { get; set; }

    /// <inheritdoc />
    public float? YarnExtrapolationFactor { get; set; }

    /// <inheritdoc />
    public float? YarnAttentionFactor { get; set; }

    /// <inheritdoc />
    public float? YarnBetaFast { get; set; }

    /// <inheritdoc />
    public float? YarnBetaSlow { get; set; }

    /// <inheritdoc />
    public uint? YarnOriginalContext { get; set; }

    /// <inheritdoc />
    public RopeScalingType? YarnScalingType { get; set; }

    /// <inheritdoc />
    public GGMLType? TypeK { get; set; }

    /// <inheritdoc />
    public GGMLType? TypeV { get; set; }

    /// <inheritdoc />
    public bool NoKqvOffload { get; set; }

    /// <inheritdoc />
    public Encoding Encoding { get; set; } = Encoding.UTF8;

    /// <inheritdoc />
    public bool VocabOnly { get; set; }

    /// <inheritdoc />
    public float DefragThreshold { get; set; }

    /// <inheritdoc />
    public LLamaPoolingType PoolingType { get; set; }
}