C# client for interacting with KoboldCpp through its native and OpenAI-compatible endpoints.
- Complete support for KoboldCpp's native API
- OpenAI-compatible API endpoint support
- Streaming text generation
- Comprehensive configuration options
- Built-in error handling and logging
- Cross-platform compatibility
- Full async/await support
Install via NuGet:
dotnet add package SpongeEngine.KoboldSharp
using SpongeEngine.KoboldSharp.Client;
using SpongeEngine.KoboldSharp.Models;
// Configure the client
var options = new KoboldSharpOptions
{
BaseUrl = "http://localhost:5001",
UseGpu = true,
ContextSize = 2048
};
// Create client instance
using var client = new KoboldSharpClient(options);
// Generate completion
var request = new KoboldSharpRequest
{
Prompt = "Write a short story about a robot:",
MaxLength = 200,
Temperature = 0.7f,
TopP = 0.9f
};
var response = await client.GenerateAsync(request);
Console.WriteLine(response.Results[0].Text);
// Stream completion
await foreach (var token in client.GenerateStreamAsync(request))
{
Console.Write(token);
}
// Alternatively, use the OpenAI-compatible API
var options = new KoboldSharpOptions
{
BaseUrl = "http://localhost:5001",
UseOpenAiApi = true
};
using var client = new KoboldSharpClient(options);
// Simple completion
string response = await client.CompleteAsync(
"Write a short story about:",
new CompletionOptions
{
MaxTokens = 200,
Temperature = 0.7f,
TopP = 0.9f
});
// Stream completion
await foreach (var token in client.StreamCompletionAsync(
"Once upon a time...",
new CompletionOptions { MaxTokens = 200 }))
{
Console.Write(token);
}
var options = new KoboldSharpOptions
{
BaseUrl = "http://localhost:5001", // KoboldCpp server URL
ApiKey = "optional_api_key", // Optional API key
TimeoutSeconds = 600, // Request timeout, in seconds
ContextSize = 2048, // Maximum context size
UseGpu = true, // Enable GPU acceleration
UseOpenAiApi = false // Set to true to use the OpenAI-compatible API
};
var request = new KoboldSharpRequest
{
Prompt = "Your prompt here",
MaxLength = 200, // Maximum tokens to generate
MaxContextLength = 2048, // Maximum context length
Temperature = 0.7f, // Sampling temperature; higher values give more random output
TopP = 0.9f, // Nucleus sampling threshold
TopK = 40, // Top-K sampling
TopA = 0.0f, // Top-A sampling
Typical = 1.0f, // Typical sampling
Tfs = 1.0f, // Tail-free sampling
RepetitionPenalty = 1.1f, // Repetition penalty
RepetitionPenaltyRange = 64, // Penalty range
StopSequences = new List<string> { "\n" }, // Stop sequences
Stream = false, // Set to true to enable streaming
TrimStop = true, // Trim stop sequences
MirostatMode = 0, // Mirostat sampling mode
MirostatTau = 5.0f, // Mirostat target entropy
MirostatEta = 0.1f // Mirostat learning rate
};
try
{
var response = await client.GenerateAsync(request);
}
catch (KoboldSharpException ex)
{
Console.WriteLine($"KoboldCpp error: {ex.Message}");
Console.WriteLine($"Provider: {ex.Provider}");
if (ex.StatusCode.HasValue)
{
Console.WriteLine($"Status code: {ex.StatusCode}");
}
if (ex.ResponseContent != null)
{
Console.WriteLine($"Response content: {ex.ResponseContent}");
}
}
catch (Exception ex)
{
Console.WriteLine($"General error: {ex.Message}");
}
The client supports Microsoft.Extensions.Logging:
ILogger logger = LoggerFactory
.Create(builder => builder
.AddConsole()
.SetMinimumLevel(LogLevel.Debug))
.CreateLogger<KoboldSharpClient>();
var client = new KoboldSharpClient(options, logger);
Custom Newtonsoft.Json serializer settings can be provided:
var jsonSettings = new JsonSerializerSettings
{
NullValueHandling = NullValueHandling.Ignore,
DefaultValueHandling = DefaultValueHandling.Ignore
};
var client = new KoboldSharpClient(options, jsonSettings: jsonSettings);
The library includes both unit and integration tests. Integration tests require a running KoboldCpp server.
To run the tests:
dotnet test
To configure the test environment:
// Set environment variables for testing
Environment.SetEnvironmentVariable("KOBOLDCPP_BASE_URL", "http://localhost:5001");
Environment.SetEnvironmentVariable("KOBOLDCPP_OPENAI_BASE_URL", "http://localhost:5001/v1");
This project is licensed under the MIT License - see the LICENSE file for details.
Contributions are welcome! Please feel free to submit a Pull Request.
For issues and feature requests, please use the GitHub issues page.