diff --git a/LLama/Abstractions/IModelParams.cs b/LLama/Abstractions/IModelParams.cs
index a8b87acc..ad0608d7 100644
--- a/LLama/Abstractions/IModelParams.cs
+++ b/LLama/Abstractions/IModelParams.cs
@@ -77,11 +77,6 @@ namespace LLama.Abstractions
///
int BatchSize { get; set; }
- ///
- /// Whether to convert eos to newline during the inference.
- ///
- bool ConvertEosToNewLine { get; set; }
-
///
/// Whether to use embedding mode. (embedding) Note that if this is set to true,
/// The LLamaModel won't produce text response anymore.
diff --git a/LLama/Common/ModelParams.cs b/LLama/Common/ModelParams.cs
index f5c98fae..1ce18dd8 100644
--- a/LLama/Common/ModelParams.cs
+++ b/LLama/Common/ModelParams.cs
@@ -69,11 +69,6 @@ namespace LLama.Common
///
public int BatchSize { get; set; } = 512;
- ///
- /// Whether to convert eos to newline during the inference.
- ///
- public bool ConvertEosToNewLine { get; set; } = false;
-
///
/// Whether to use embedding mode. (embedding) Note that if this is set to true,
/// The LLamaModel won't produce text response anymore.
@@ -137,7 +132,6 @@ namespace LLama.Common
/// Base model path for the lora adapter (lora_base)
/// Number of threads (-1 = autodetect) (n_threads)
/// Batch size for prompt processing (must be >=32 to use BLAS) (n_batch)
- /// Whether to convert eos to newline during the inference.
/// Whether to use embedding mode. (embedding) Note that if this is set to true, The LLamaModel won't produce text response anymore.
/// RoPE base frequency.
/// RoPE frequency scaling factor
@@ -148,7 +142,7 @@ namespace LLama.Common
int seed = 1337, bool useFp16Memory = true,
bool useMemorymap = true, bool useMemoryLock = false, bool perplexity = false,
string loraAdapter = "", string loraBase = "", int threads = -1, int batchSize = 512,
- bool convertEosToNewLine = false, bool embeddingMode = false,
+ bool embeddingMode = false,
float ropeFrequencyBase = 10000.0f, float ropeFrequencyScale = 1f, bool mulMatQ = false,
string encoding = "UTF-8")
{
@@ -164,7 +158,6 @@ namespace LLama.Common
LoraBase = loraBase;
Threads = threads == -1 ? Math.Max(Environment.ProcessorCount / 2, 1) : threads;
BatchSize = batchSize;
- ConvertEosToNewLine = convertEosToNewLine;
EmbeddingMode = embeddingMode;
RopeFrequencyBase = ropeFrequencyBase;
RopeFrequencyScale = ropeFrequencyScale;