-
Notifications
You must be signed in to change notification settings - Fork 341
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Pulled conversion of a
IModelParams
into a LLamaContextParams
out…
… into an extension method which can be used in other places.
- Loading branch information
1 parent
f1111a9
commit f249937
Showing
2 changed files
with
63 additions
and
36 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,54 @@ | ||
using System.IO; | ||
using System; | ||
using System.Buffers; | ||
using LLama.Abstractions; | ||
using LLama.Native; | ||
|
||
namespace LLama.Extensions | ||
{ | ||
internal static class IModelParamsExtensions | ||
{ | ||
/// <summary> | ||
/// Convert the given `IModelParams` into a `LLamaContextParams` | ||
/// </summary> | ||
/// <param name="params"></param> | ||
/// <param name="result"></param> | ||
/// <returns></returns> | ||
/// <exception cref="FileNotFoundException"></exception> | ||
/// <exception cref="ArgumentException"></exception> | ||
public static MemoryHandle ToLlamaContextParams(this IModelParams @params, out LLamaContextParams result) | ||
{ | ||
if (!File.Exists(@params.ModelPath)) | ||
throw new FileNotFoundException($"The model file does not exist: {@params.ModelPath}"); | ||
|
||
if (@params.TensorSplits != null && @params.TensorSplits.Length != 1) | ||
throw new ArgumentException("Currently multi-gpu support is not supported by both llama.cpp and LLamaSharp."); | ||
|
||
result = NativeApi.llama_context_default_params(); | ||
result.n_ctx = @params.ContextSize; | ||
result.n_batch = @params.BatchSize; | ||
result.main_gpu = @params.MainGpu; | ||
result.n_gpu_layers = @params.GpuLayerCount; | ||
result.seed = @params.Seed; | ||
result.f16_kv = @params.UseFp16Memory; | ||
result.use_mmap = @params.UseMemoryLock; | ||
result.use_mlock = @params.UseMemoryLock; | ||
result.logits_all = @params.Perplexity; | ||
result.embedding = @params.EmbeddingMode; | ||
result.low_vram = @params.LowVram; | ||
result.n_gqa = @params.GroupedQueryAttention; | ||
result.rms_norm_eps = @params.RmsNormEpsilon; | ||
result.rope_freq_base = @params.RopeFrequencyBase; | ||
result.rope_freq_scale = @params.RopeFrequencyScale; | ||
result.mul_mat_q = @params.MulMatQ; | ||
|
||
var pin = @params.TensorSplits.AsMemory().Pin(); | ||
unsafe | ||
{ | ||
result.tensor_split = (nint)pin.Pointer; | ||
} | ||
|
||
return pin; | ||
} | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters