Commit b1e9a00
feat: swift-binding-release (#545)
* add nexasdk swift binding
* add readme
* add generationStream
* Update README.md
* add Example
* Add embedding by input IDs to Embedder
* Make `generationStream` public in LLMLlama and VLMLlama
* Refactor test
* Refactor DeviceList to Device
  Replaces the DeviceList struct with a Device struct containing id and name. Updates getLlamaDeviceList to return an array of Device instead of DeviceList, and adjusts the logic to build the array accordingly. This simplifies the API and improves clarity.
* Refactor embedding and generation APIs, and add embedding search
  - Refactored embedding output to return 2D arrays and updated related logic.
  - Unified and renamed LLM and VLM generation methods to 'generate' and 'generateAsyncStream' for consistency.
  - Updated the Model protocol and extensions accordingly.
  - Added an EmbeddingSearch utility and a test for embedding-based document search.
  - Updated tests to use the new APIs and improved test coverage.
* update: `ml.h` align
* Update framework revision
* Update README.md
* Fix typo: templeteOptions to templateOptions
  - Renamed all instances of 'templeteOptions' to 'templateOptions' in GenerationOptions.
  - Updated test and usage in README for clarity.
* remove example
* update package revision
1 parent 2fb5f2b commit b1e9a00

26 files changed: +2285 −1 lines changed

.gitignore

Lines changed: 7 additions & 1 deletion
@@ -71,4 +71,10 @@ tmp/
 __debug_bin

 # TLS certificates
-*.pem
+*.pem
+/.swiftpm
+/bindings/ios/Example/Example.xcodeproj/project.xcworkspace/xcuserdata
+/bindings/ios/NexaAI/.swiftpm
+/.build
+/bindings/ios/Example/Example.xcodeproj/project.xcworkspace/xcshareddata
+/bindings/ios/Example/Example.xcodeproj/xcuserdata

Package.resolved

Lines changed: 14 additions & 0 deletions
Some generated files are not rendered by default.

Package.swift

Lines changed: 42 additions & 0 deletions
// swift-tools-version: 5.9
// The swift-tools-version declares the minimum version of Swift required to build this package.
import PackageDescription

let package = Package(
    name: "NexaAI",
    platforms: [
        .macOS(.v14), .iOS(.v17),
    ],
    products: [
        .library(name: "NexaAI", targets: ["NexaAI"])
    ],
    dependencies: [
        .package(url: "git@github.com:NexaAI/nexasdk-mobile-iOS-framework.git", branch: "main")
    ],
    targets: [
        // Targets are the basic building blocks of a package, defining a module or a test suite.
        // Targets can depend on other targets in this package and products from dependencies.
        .target(
            name: "NexaAI",
            dependencies: [
                .product(name: "NexaBridge", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "LlamaPlugin", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "llama", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "common", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "mtmd", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml-base", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml-cpu", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml-metal", package: "nexasdk-mobile-iOS-framework")
            ],
            path: "bindings/ios/NexaAI/Sources",
            swiftSettings: [.interoperabilityMode(.Cxx)]
        ),
        .testTarget(
            name: "NexaAITests",
            dependencies: ["NexaAI"],
            path: "bindings/ios/NexaAI/Tests",
            swiftSettings: [.interoperabilityMode(.Cxx)],
        ),
    ]
)
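With a manifest at the repository root, the Swift binding can be pulled in via Swift Package Manager. The following consumer manifest is a minimal sketch, not part of this commit: the repository URL, branch, and app target name are assumptions to adapt.

// Hypothetical consumer Package.swift — URL and branch are placeholders, not taken from this diff.
// swift-tools-version: 5.9
import PackageDescription

let package = Package(
    name: "MyApp",
    platforms: [.iOS(.v17), .macOS(.v14)],
    dependencies: [
        // Point this at the repository that hosts the root Package.swift above.
        .package(url: "https://github.com/NexaAI/nexa-sdk.git", branch: "main")
    ],
    targets: [
        .executableTarget(
            name: "MyApp",
            dependencies: [.product(name: "NexaAI", package: "nexa-sdk")],
            // The NexaAI target builds with C++ interoperability, so consumers need the same setting.
            swiftSettings: [.interoperabilityMode(.Cxx)]
        )
    ]
)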

bindings/ios/NexaAI/Package.resolved

Lines changed: 14 additions & 0 deletions
Some generated files are not rendered by default.

bindings/ios/NexaAI/Package.swift

Lines changed: 42 additions & 0 deletions
// swift-tools-version: 5.9
// The swift-tools-version declares the minimum version of Swift required to build this package.

import PackageDescription

let package = Package(
    name: "NexaAI",
    platforms: [.iOS(.v17), .macOS(.v14)],
    products: [
        // Products define the executables and libraries a package produces, making them visible to other packages.
        .library(name: "NexaAI", targets: ["NexaAI"]),
    ],

    dependencies: [
        .package(url: "git@github.com:NexaAI/nexasdk-mobile-iOS-framework.git", branch: "main")
    ],

    targets: [
        // Targets are the basic building blocks of a package, defining a module or a test suite.
        // Targets can depend on other targets in this package and products from dependencies.
        .target(
            name: "NexaAI",
            dependencies: [
                .product(name: "NexaBridge", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "LlamaPlugin", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "llama", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "common", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "mtmd", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml-base", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml-cpu", package: "nexasdk-mobile-iOS-framework"),
                .product(name: "ggml-metal", package: "nexasdk-mobile-iOS-framework")
            ],
            swiftSettings: [.interoperabilityMode(.Cxx)],
        ),
        .testTarget(
            name: "NexaAITests",
            dependencies: ["NexaAI"],
            swiftSettings: [.interoperabilityMode(.Cxx)],
        ),
    ]
)

Lines changed: 26 additions & 0 deletions
import Foundation

public struct ChatMessage {
    public var role: Role
    public var content: String
    public var images: [String]
    public var audios: [String]

    public init(
        role: Role,
        content: String,
        images: [String] = [],
        audios: [String] = []
    ) {
        self.role = role
        self.content = content
        self.images = images
        self.audios = audios
    }
}

public enum Role: String {
    case user
    case assistant
    case system
}
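Since ChatMessage is a plain value struct with defaulted image and audio lists, building a short multimodal conversation is just literal construction. A minimal sketch; the image path is a made-up placeholder.

// Sketch only — the file path below is hypothetical.
let conversation: [ChatMessage] = [
    ChatMessage(role: .system, content: "You are a helpful assistant."),
    ChatMessage(role: .user, content: "What is in this photo?", images: ["/tmp/photo.jpg"]),
]
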
Lines changed: 24 additions & 0 deletions
import Foundation

public struct EmbeddingConfig {

    public var batchSize: Int32
    public var normalize: Bool
    public var normalizeMethod: NormalizeMethod

    public init(batchSize: Int32, normalize: Bool, normalizeMethod: NormalizeMethod) {
        self.batchSize = batchSize
        self.normalize = normalize
        self.normalizeMethod = normalizeMethod
    }
}

public extension EmbeddingConfig {

    enum NormalizeMethod: String {
        case l2
        case mean
        case none
    }
}
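A quick construction sketch; the values are arbitrary, and how the Embedder consumes the config is not shown in this diff.

// Arbitrary example values; tune batch size and normalization to your workload.
let embeddingConfig = EmbeddingConfig(
    batchSize: 32,
    normalize: true,
    normalizeMethod: .l2
)
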
Lines changed: 45 additions & 0 deletions
import Foundation

/*
LLM / VLM generation configuration (IMPROVED: support multiple images and audios)
typedef struct {
    int32_t max_tokens;               /* Maximum tokens to generate */
    const char** stop;                /* Array of stop sequences */
    int32_t stop_count;               /* Number of stop sequences */
    int32_t n_past;                   /* Number of past tokens to consider */
    ml_SamplerConfig* sampler_config; /* Advanced sampling config */
    // --- Improved multimodal support ---
    ml_Path* image_paths;             /* Array of image paths for VLM (NULL if none) */
    int32_t image_count;              /* Number of images */
    ml_Path* audio_paths;             /* Array of audio paths for VLM (NULL if none) */
    int32_t audio_count;              /* Number of audios */
} ml_GenerationConfig;
*/

/// LLM / VLM generation configuration
public struct GenerationConfig: Codable {
    public var maxTokens: Int32              // Maximum tokens to generate
    public var stop: [String]                // Array of stop sequences
    public var nPast: Int32                  // Number of past tokens to consider
    public var samplerConfig: SamplerConfig  // Advanced sampling config
    public var imagePaths: [String]          // Array of image paths for VLM
    public var audioPaths: [String]          // Array of audio paths for VLM

    public init(
        maxTokens: Int32 = 1024,
        stop: [String] = [],
        nPast: Int32 = 0,
        samplerConfig: SamplerConfig = .default,
        imagePaths: [String] = [],
        audioPaths: [String] = []
    ) {
        self.maxTokens = maxTokens
        self.stop = stop
        self.nPast = nPast
        self.samplerConfig = samplerConfig
        self.imagePaths = imagePaths
        self.audioPaths = audioPaths
    }

    public static let `default` = GenerationConfig()
}
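A sketch of filling out GenerationConfig for a vision prompt. The stop sequence and image path are made up, and SamplerConfig (referenced via .default) is defined in a file not shown in this excerpt.

// Illustrative values only.
let generationConfig = GenerationConfig(
    maxTokens: 512,
    stop: ["</s>"],
    samplerConfig: .default,
    imagePaths: ["/tmp/photo.jpg"]  // hypothetical path handed through to the VLM
)
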
Lines changed: 69 additions & 0 deletions
import NexaBridge

/** LLM / VLM model configuration */
/*
typedef struct {
    int32_t n_ctx;                     // text context, 0 = from model
    int32_t n_threads;                 // number of threads to use for generation
    int32_t n_threads_batch;           // number of threads to use for batch processing
    int32_t n_batch;                   // logical maximum batch size that can be submitted to llama_decode
    int32_t n_ubatch;                  // physical maximum batch size
    int32_t n_seq_max;                 // max number of sequences (i.e. distinct states for recurrent models)
    ml_Path chat_template_path;        // path to chat template file, optional
    const char* chat_template_content; // content of chat template file, optional
    // For QNN
    ml_Path system_library_path;       /* System library path */
    ml_Path backend_library_path;      /* Backend library path */
    ml_Path extension_library_path;    /* Extension library path */
    ml_Path config_file_path;          /* Config file path */
    ml_Path embedded_tokens_path;      /* Embedded tokens path */
    int32_t max_tokens;                /* Maximum tokens */
    bool enable_thinking;              /* Enable thinking */
    bool verbose;                      /* Verbose */
} ml_ModelConfig;
*/

public struct ModelConfig: Codable {
    public var nCtx: Int32
    public var nThreads: Int32
    public var nThreadsBatch: Int32
    public var nBatch: Int32
    public var nUbatch: Int32
    public var nSeqMax: Int32

    public var chatTemplatePath: String?
    public var chatTemplateContent: String?

    public static let `default`: ModelConfig = {
        return .init(
            nCtx: 2048,
            nThreads: 0,
            nThreadsBatch: 0,
            nBatch: 0,
            nUbatch: 0,
            nSeqMax: 0,
            chatTemplatePath: nil,
            chatTemplateContent: nil
        )
    }()

    public init(
        nCtx: Int32 = 2048,
        nThreads: Int32 = 0,
        nThreadsBatch: Int32 = 0,
        nBatch: Int32 = 0,
        nUbatch: Int32 = 0,
        nSeqMax: Int32 = 0,
        chatTemplatePath: String? = nil,
        chatTemplateContent: String? = nil
    ) {
        self.nCtx = nCtx
        self.nThreads = nThreads
        self.nThreadsBatch = nThreadsBatch
        self.nBatch = nBatch
        self.nUbatch = nUbatch
        self.nSeqMax = nSeqMax
        self.chatTemplatePath = chatTemplatePath
        self.chatTemplateContent = chatTemplateContent
    }
}
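Every field of ModelConfig has a default (nCtx 2048, zeros elsewhere, which per the mirrored C header means "use the backend's value"), so callers only override what they need. A small sketch:

// Use the initializer's defaults and only raise the context window.
let modelConfig = ModelConfig(nCtx: 4096)

// Or take the canned configuration as-is.
let defaultConfig = ModelConfig.default
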
Lines changed: 88 additions & 0 deletions
/*
/** Profiling data structure for LLM/VLM performance metrics */
typedef struct {
    int64_t ttft;             /* Time to first token (us) */
    int64_t prompt_time;      /* Prompt processing time (us) */
    int64_t decode_time;      /* Token generation time (us) */

    int64_t prompt_tokens;    /* Number of prompt tokens */
    int64_t generated_tokens; /* Number of generated tokens */
    int64_t audio_duration;   /* Audio duration (us) */

    double prefill_speed;     /* Prefill speed (tokens/sec) */
    double decoding_speed;    /* Decoding speed (tokens/sec) */
    double real_time_factor;  /* Real-Time Factor (RTF) (1.0 = real-time, >1.0 = faster, <1.0 = slower) */

    const char* stop_reason;  /* Stop reason: "eos", "length", "user", "stop_sequence" */
} ml_ProfileData;

*/
import NexaBridge

public struct ProfileData: CustomStringConvertible {
    public let ttft: Int64
    public let promptTime: Int64
    public let decodeTime: Int64

    public let promptTokens: Int64
    public let generatedTokens: Int64
    public let audioDuration: Int64

    public let prefillSpeed: Double
    public let decodingSpeed: Double
    public let realTimeFactor: Double

    public let stopReason: String

    public init(
        ttft: Int64 = 0,
        promptTime: Int64 = 0,
        decodeTime: Int64 = 0,
        promptTokens: Int64 = 0,
        generatedTokens: Int64 = 0,
        audioDuration: Int64 = 0,
        prefillSpeed: Double = 0.0,
        decodingSpeed: Double = 0.0,
        realTimeFactor: Double = 0.0,
        stopReason: String = ""
    ) {
        self.ttft = ttft
        self.promptTime = promptTime
        self.decodeTime = decodeTime
        self.promptTokens = promptTokens
        self.generatedTokens = generatedTokens
        self.audioDuration = audioDuration
        self.prefillSpeed = prefillSpeed
        self.decodingSpeed = decodingSpeed
        self.realTimeFactor = realTimeFactor
        self.stopReason = stopReason
    }

    init(from cProfileData: ml_ProfileData) {
        self.ttft = cProfileData.ttft
        self.promptTime = cProfileData.prompt_time
        self.decodeTime = cProfileData.decode_time
        self.promptTokens = cProfileData.prompt_tokens
        self.generatedTokens = cProfileData.generated_tokens
        self.audioDuration = cProfileData.audio_duration
        self.prefillSpeed = cProfileData.prefill_speed
        self.decodingSpeed = cProfileData.decoding_speed
        self.realTimeFactor = cProfileData.real_time_factor
        self.stopReason = cProfileData.stop_reason == nil ? "" : String(cString: cProfileData.stop_reason!)
    }

    public var description: String {
        """
        TTFT: \(ttft) us
        Prompt Time: \(promptTime) us
        Decode Time: \(decodeTime) us
        Prompt Tokens: \(promptTokens)
        Generated Tokens: \(generatedTokens)
        Audio Duration: \(audioDuration) us
        Prefill Speed: \(prefillSpeed) t/s
        Decoding Speed: \(decodingSpeed) t/s
        Real Time Factor: \(realTimeFactor)
        Stop reason: \(stopReason)
        """
    }
}
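Because ProfileData conforms to CustomStringConvertible, printing a value yields the multi-line report built in description above. A tiny sketch with fabricated numbers:

// Fabricated metrics, purely to show the printed report format.
let profile = ProfileData(ttft: 120_000, promptTokens: 42, generatedTokens: 256, decodingSpeed: 31.5, stopReason: "eos")
print(profile)  // "TTFT: 120000 us", "Prompt Time: 0 us", ... down to "Stop reason: eos"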
