managedcode
diff --git a/native/include/mlxsharp/api.h b/native/include/mlxsharp/api.h
Lines changed: 0 additions & 27 deletions
diff --git a/native/src/mlxsharp.cpp b/native/src/mlxsharp.cpp
Lines changed: 0 additions & 101 deletions
diff --git a/src/MLXSharp.Tests/ModelIntegrationTests.cs b/src/MLXSharp.Tests/ModelIntegrationTests.cs
Lines changed: 21 additions & 4 deletions
diff --git a/src/MLXSharp.Tests/TestEnvironment.cs b/src/MLXSharp.Tests/TestEnvironment.cs
Lines changed: 55 additions & 16 deletions
diff --git a/src/MLXSharp.Tests/TokenizerSmokeTests.cs b/src/MLXSharp.Tests/TokenizerSmokeTests.cs
Lines changed: 0 additions & 37 deletions
@@ -137,18 +137,6 @@ typedef struct mlx_usage {
     int output_tokens;
 } mlx_usage;
 
-typedef struct mlxsharp_generation_options {
-    int max_tokens;
-    float temperature;
-    float top_p;
-    int top_k;
-} mlxsharp_generation_options;
-
-typedef struct mlxsharp_token_buffer {
-    int32_t* tokens;
-    size_t length;
-} mlxsharp_token_buffer;
-
 int mlxsharp_create_session(
     const char* chat_model_id,
     const char* embedding_model_id,
@@ -183,21 +171,6 @@ void mlxsharp_free_buffer(unsigned char* buffer);
 
 void mlxsharp_release_session(void* session);
 
-int mlxsharp_session_load_model(
-    void* session,
-    const char* model_directory,
-    const char* tokenizer_path);
-
-int mlxsharp_session_generate_tokens(
-    void* session,
-    const int32_t* prompt_tokens,
-    size_t prompt_token_count,
-    const mlxsharp_generation_options* options,
-    mlxsharp_token_buffer* output_tokens,
-    mlx_usage* usage);
-
-void mlxsharp_release_tokens(mlxsharp_token_buffer* buffer);
-
 #ifdef __cplusplus
 }
 #endif
@@ -1,5 +1,4 @@
 #include "mlxsharp/api.h"
-#include "mlxsharp/llm_model_runner.h"
 
 #include <algorithm>
 #include <atomic>
@@ -44,8 +43,6 @@ struct mlxsharp_session {
     std::string chat_model;
     std::string embedding_model;
     std::string image_model;
-    std::unique_ptr<mlxsharp::llm::ModelRunner> model_runner;
-
     mlxsharp_session(mlxsharp_context_t* ctx, std::string chat, std::string embed, std::string image)
         : context(ctx),
           chat_model(std::move(chat)),
@@ -565,104 +562,6 @@ void mlxsharp_free_buffer(unsigned char* data) {
     std::free(data);
 }
 
-int mlxsharp_session_load_model(
-    void* session_ptr,
-    const char* model_directory,
-    const char* tokenizer_path) {
-    if (session_ptr == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, "Session pointer is null.");
-    }
-
-    if (model_directory == nullptr || tokenizer_path == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, "Model directory or tokenizer path is null.");
-    }
-
-    auto* session = static_cast<mlxsharp_session_t*>(session_ptr);
-
-    return invoke([&]() -> int {
-        auto model = mlxsharp::llm::ModelRunner::Create(model_directory, tokenizer_path);
-        session->model_runner = std::move(model);
-        return MLXSHARP_STATUS_SUCCESS;
-    });
-}
-
-int mlxsharp_session_generate_tokens(
-    void* session_ptr,
-    const int32_t* prompt_tokens,
-    size_t prompt_token_count,
-    const mlxsharp_generation_options* options,
-    mlxsharp_token_buffer* output_tokens,
-    mlx_usage* usage) {
-    if (session_ptr == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, "Session pointer is null.");
-    }
-
-    if (output_tokens == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, kNullOutParameter);
-    }
-
-    output_tokens->tokens = nullptr;
-    output_tokens->length = 0;
-
-    auto* session = static_cast<mlxsharp_session_t*>(session_ptr);
-
-    if (session->model_runner == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, "Model is not loaded. Call mlxsharp_session_load_model first.");
-    }
-
-    if (prompt_token_count > 0 && prompt_tokens == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, "Prompt tokens pointer is null.");
-    }
-
-    if (options == nullptr) {
-        return set_error(MLXSHARP_STATUS_INVALID_ARGUMENT, "Generation options pointer is null.");
-    }
-
-    return invoke([&]() -> int {
-        std::vector<int32_t> prompt;
-        prompt.reserve(prompt_token_count);
-        for (size_t i = 0; i < prompt_token_count; ++i) {
-            prompt.push_back(prompt_tokens[i]);
-        }
-
-        mlxsharp::llm::GenerationOptions native_options{
-            options->max_tokens,
-            options->temperature,
-            options->top_p,
-            options->top_k,
-        };
-
-        auto generated = session->model_runner->Generate(prompt, native_options);
-        output_tokens->length = generated.size();
-
-        if (generated.empty()) {
-            assign_usage(usage, static_cast<int>(prompt_token_count), 0);
-            return MLXSHARP_STATUS_SUCCESS;
-        }
-
-        auto* buffer = static_cast<int32_t*>(std::malloc(generated.size() * sizeof(int32_t)));
-        if (buffer == nullptr) {
-            return set_error(MLXSHARP_STATUS_OUT_OF_MEMORY, "Failed to allocate output token buffer.");
-        }
-
-        std::memcpy(buffer, generated.data(), generated.size() * sizeof(int32_t));
-        output_tokens->tokens = buffer;
-
-        assign_usage(usage, static_cast<int>(prompt_token_count), static_cast<int>(generated.size()));
-        return MLXSHARP_STATUS_SUCCESS;
-    });
-}
-
-void mlxsharp_release_tokens(mlxsharp_token_buffer* buffer) {
-    if (buffer == nullptr || buffer->tokens == nullptr) {
-        return;
-    }
-
-    std::free(buffer->tokens);
-    buffer->tokens = nullptr;
-    buffer->length = 0;
-}
-
 void mlxsharp_release_session(void* session_ptr) {
     if (session_ptr == nullptr) {
         return;
 
@@ -5,7 +5,6 @@
 using MLXSharp;
 using MLXSharp.Backends;
 using Xunit;
-using Xunit.Sdk;
 
 namespace MLXSharp.Tests;
 
@@ -24,7 +23,7 @@ public async Task NativeBackendAnswersSimpleMathAsync()
             new[] { new ChatMessage(ChatRole.User, "Скільки буде 2+2?") },
             new ChatOptions { Temperature = 0 });
 
-        var result = await backend.GenerateTextAsync(request, CancellationToken.None).ConfigureAwait(false);
+        var result = await backend.GenerateTextAsync(request, CancellationToken.None);
 
         Assert.False(string.IsNullOrWhiteSpace(result.Text));
         Assert.Contains("4", result.Text);
@@ -39,6 +38,24 @@ private static MlxClientOptions CreateOptions()
             EnableNativeModelRunner = false,
         };
 
+        var modelId = Environment.GetEnvironmentVariable("MLXSHARP_HF_MODEL_ID");
+        if (!string.IsNullOrWhiteSpace(modelId))
+        {
+            options.ChatModelId = modelId;
+        }
+
+        var modelDirectory = Environment.GetEnvironmentVariable("MLXSHARP_MODEL_PATH");
+        if (!string.IsNullOrWhiteSpace(modelDirectory))
+        {
+            options.NativeModelDirectory = modelDirectory;
+        }
+
+        var tokenizerPath = Environment.GetEnvironmentVariable("MLXSHARP_TOKENIZER_PATH");
+        if (!string.IsNullOrWhiteSpace(tokenizerPath))
+        {
+            options.TokenizerPath = tokenizerPath;
+        }
+
         return options;
     }
 
@@ -47,13 +64,13 @@ private static void EnsureAssetsOrSkip()
         var modelPath = Environment.GetEnvironmentVariable("MLXSHARP_MODEL_PATH");
         if (string.IsNullOrWhiteSpace(modelPath) || !System.IO.Directory.Exists(modelPath))
         {
-            throw new SkipException("Native model bundle not found.");
+            Skip.If(true, "Native model bundle not found.");
         }
 
         var library = Environment.GetEnvironmentVariable("MLXSHARP_LIBRARY");
         if (string.IsNullOrWhiteSpace(library) || !System.IO.File.Exists(library))
         {
-            throw new SkipException("Native libmlxsharp library not configured.");
+            Skip.If(true, "Native libmlxsharp library not configured.");
         }
     }
 }
@@ -25,38 +25,40 @@ public static void EnsureInitialized()
 
     private static void ConfigureNativeLibrary(string repoRoot)
     {
-        if (!string.IsNullOrWhiteSpace(Environment.GetEnvironmentVariable("MLXSHARP_LIBRARY")))
+        var existing = Environment.GetEnvironmentVariable("MLXSHARP_LIBRARY"); // Resolves the native library: a pre-set MLXSHARP_LIBRARY is considered first, then per-OS candidates under repoRoot/libs.
+        if (!string.IsNullOrWhiteSpace(existing) && File.Exists(existing)) // A blank value or a path to a missing file is ignored and the candidate probing below runs instead.
         {
+            ApplyNativeLibrary(existing); // Applied even though the variable is already set, so the rest of ApplyNativeLibrary's setup still runs for a caller-supplied path.
             return;
         }
 
         string? libraryPath = null;
         if (RuntimeInformation.IsOSPlatform(OSPlatform.OSX))
         {
-            var candidate = Path.Combine(repoRoot, "libs", "native-osx-arm64", "libmlxsharp.dylib");
-            if (File.Exists(candidate))
+            var candidates = new[] // macOS locations, listed in probe order.
             {
-                libraryPath = candidate;
-            }
+                Path.Combine(repoRoot, "libs", "native-osx-arm64", "libmlxsharp.dylib"),
+                Path.Combine(repoRoot, "libs", "native-libs", "libmlxsharp.dylib"),
+                Path.Combine(repoRoot, "libs", "native-libs", "osx-arm64", "libmlxsharp.dylib"),
+            };
+
+            libraryPath = Array.Find(candidates, File.Exists); // First candidate that exists on disk; null when none does.
         }
         else if (RuntimeInformation.IsOSPlatform(OSPlatform.Linux))
         {
-            var candidate = Path.Combine(repoRoot, "libs", "native-libs", "libmlxsharp.so");
-            if (File.Exists(candidate))
+            var candidates = new[] // Linux locations, listed in probe order.
             {
-                libraryPath = candidate;
-            }
+                Path.Combine(repoRoot, "libs", "native-linux", "libmlxsharp.so"),
+                Path.Combine(repoRoot, "libs", "native-libs", "libmlxsharp.so"),
+                Path.Combine(repoRoot, "libs", "native-libs", "linux-x64", "libmlxsharp.so"),
+            };
+
+            libraryPath = Array.Find(candidates, File.Exists); // First candidate that exists on disk; null when none does.
         }
 
         if (!string.IsNullOrWhiteSpace(libraryPath))
         {
-            Environment.SetEnvironmentVariable("MLXSHARP_LIBRARY", libraryPath);
-
-            var metalPath = Path.Combine(Path.GetDirectoryName(libraryPath)!, "mlx.metallib");
-            if (File.Exists(metalPath))
-            {
-                Environment.SetEnvironmentVariable("MLX_METAL_PATH", metalPath);
-            }
+            ApplyNativeLibrary(libraryPath); // Replaces the inline environment setup removed above; on other platforms libraryPath stays null and nothing is configured.
         }
     }
 
@@ -77,4 +79,41 @@ private static void ConfigureModelPaths(string repoRoot)
             Environment.SetEnvironmentVariable("MLXSHARP_TOKENIZER_PATH", tokenizerPath);
         }
     }
+
+    /// <summary>
+    /// Publishes the chosen native library to the current process: sets
+    /// <c>MLXSHARP_LIBRARY</c>, sets the Metal variables when an
+    /// <c>mlx.metallib</c> file sits next to the library, and makes a
+    /// best-effort copy of both files into <see cref="AppContext.BaseDirectory"/>.
+    /// </summary>
+    /// <param name="libraryPath">Path of the native libmlxsharp binary to use.</param>
+    private static void ApplyNativeLibrary(string libraryPath)
+    {
+        const string MetalLibraryName = "mlx.metallib";
+
+        Environment.SetEnvironmentVariable("MLXSHARP_LIBRARY", libraryPath);
+
+        // The Metal library is looked up in the same directory as the native library.
+        var libraryDirectory = Path.GetDirectoryName(libraryPath)!;
+        var metalLibrary = Path.Combine(libraryDirectory, MetalLibraryName);
+        if (File.Exists(metalLibrary))
+        {
+            // Both variable names receive the same path.
+            foreach (var variable in new[] { "MLX_METAL_PATH", "MLX_METALLIB" })
+            {
+                Environment.SetEnvironmentVariable(variable, metalLibrary);
+            }
+        }
+
+        // Destination file name depends on the platform; other platforms get the bare name.
+        string targetName;
+        if (RuntimeInformation.IsOSPlatform(OSPlatform.OSX))
+        {
+            targetName = "libmlxsharp.dylib";
+        }
+        else if (RuntimeInformation.IsOSPlatform(OSPlatform.Linux))
+        {
+            targetName = "libmlxsharp.so";
+        }
+        else
+        {
+            targetName = "libmlxsharp";
+        }
+
+        var outputDirectory = AppContext.BaseDirectory;
+        TryCopy(libraryPath, Path.Combine(outputDirectory, targetName));
+
+        // Existence is probed again here, after the library copy, before copying the Metal library.
+        if (File.Exists(metalLibrary))
+        {
+            TryCopy(metalLibrary, Path.Combine(outputDirectory, MetalLibraryName));
+        }
+    }
+
+    /// <summary>
+    /// Copies <paramref name="source"/> to <paramref name="destination"/>,
+    /// creating the destination directory first and overwriting an existing
+    /// file. Any exception raised along the way is swallowed.
+    /// </summary>
+    /// <param name="source">File to copy.</param>
+    /// <param name="destination">Full path of the copy to create or replace.</param>
+    private static void TryCopy(string source, string destination)
+    {
+        try
+        {
+            var targetDirectory = Path.GetDirectoryName(destination)!;
+            Directory.CreateDirectory(targetDirectory);
+            File.Copy(source, destination, true);
+        }
+        catch
+        {
+            // Deliberate best effort: a failed copy must not abort the caller.
+        }
+    }
 }