netdur
diff --git a/android/llamalib/build.gradle b/android/llamalib/build.gradle
Lines changed: 8 additions & 4 deletions
diff --git a/example/test.dart b/example/test.dart
Lines changed: 25 additions & 162 deletions
diff --git a/example/test_vision.finetuned.dart b/example/test_vision.finetuned.dart
Lines changed: 6 additions & 4 deletions
@@ -21,10 +21,14 @@ android {
                 cppFlags "-std=c++17", "-fexceptions", "-frtti"
                 arguments  "-DBUILD_SHARED_LIBS=ON",
                            "-DLLAMA_CURL=OFF",
-                           "-DGGML_VULKAN=ON",
-                           "-DGGML_VULKAN_COOPMAT_GLSLC_SUPPORT=OFF",
-                           "-DGGML_VULKAN_COOPMAT2_GLSLC_SUPPORT=OFF",
-                           "-DGGML_VULKAN_BFLOAT16_GLSLC_SUPPORT=OFF",
+
+                            // "-DGGML_OPENCL=ON",
+                            // "-DOpenCL_INCLUDE_DIR=/Users/adel/Workspace/OpenCL-Headers/include",
+
+                            // "-DGGML_VULKAN=ON",
+                           // "-DGGML_VULKAN_COOPMAT_GLSLC_SUPPORT=OFF",
+                           // "-DGGML_VULKAN_COOPMAT2_GLSLC_SUPPORT=OFF",
+                           // "-DGGML_VULKAN_BFLOAT16_GLSLC_SUPPORT=OFF",
                            // "-DVK_USE_PLATFORM_ANDROID_KHR=ON",
                            // "-DGGML_VULKAN_VALIDATE=OFF",
                            "-DLLAMA_BUILD_TESTS=OFF",
 
@@ -1,183 +1,46 @@
 // ignore_for_file: avoid_print
 
 import 'dart:io';
-import 'dart:convert';
-import 'package:http/http.dart' as http;
-import 'package:intl/intl.dart';
 import 'package:llama_cpp_dart/llama_cpp_dart.dart';
 
-// ==========================================================
-// TOOLS (No changes here, they are correct)
-// ==========================================================
+String prompt = """what is 2 * 4?""";
 
-/// Tool to get the current time.
-String getCurrentTime() {
-  final now = DateTime.now();
-  final formattedTime = DateFormat('HH:mm').format(now);
-  return "The current time is $formattedTime.";
-}
-
-/// Tool to get the weather for a city.
-Future<String> getWeather(String city) async {
-  try {
-    final url = Uri.parse('https://wttr.in/$city?format=%C,+%t');
-    final response = await http.get(url);
-    if (response.statusCode == 200) {
-      final body = response.body.trim();
-      if (body.contains(',')) {
-        return "The weather in $city is ${body.split(',')[0]} with a temperature of ${body.split(',')[1]}.";
-      }
-      return "Could not parse weather for $city. Response: $body";
-    } else {
-      return "Sorry, I couldn't get the weather for $city.";
-    }
-  } catch (e) {
-    return "An error occurred while fetching weather: $e";
-  }
-}
-
-final Map<String, Function> toolBox = {
-  'getCurrentTime': getCurrentTime,
-  'getWeather': getWeather,
-};
-
-// ==========================================================
-// PROMPT ENGINEERING
-// ==========================================================
-
-String buildToolDescriptions() {
-  return """
-- `getCurrentTime()`: Use this tool to get the current time. It takes no arguments.
-- `getWeather(city: string)`: Use this tool to get the weather for a specific city.
-""";
-}
-
-String buildSystemPrompt() {
-  return """
-You are an expert at choosing the right function to call to answer a user's question. You have access to the following tools:
-${buildToolDescriptions()}
-
-Your goal is to respond with ONLY a JSON object that represents the function call(s) needed.
-- The JSON should be an array of objects.
-- Each object must have a "tool_name" and an "arguments" map.
-- If no tool is needed, or if you don't have enough information (e.g., the user asks for weather but doesn't name a city), respond with an empty JSON array: `[]`.
-- Do NOT add any other text, explanation, or conversation.
-
-Example:
-User: What's the weather like in Paris?
-Your response:
-[
-  {"tool_name": "getWeather", "arguments": {"city": "Paris"}}
-]
-
-User: what time is it?
-Your response:
-[
-  {"tool_name": "getCurrentTime", "arguments": {}}
-]
-
-User: Tell me a joke.
-Your response:
-[]
-""";
-}
-
-// ==========================================================
-// MAIN AGENT LOGIC (This is where the fix is)
-// ==========================================================
-
-Future<void> main() async {
+void main() async {
   try {
-    // --- Standard LLM Setup (using your working example's structure) ---
     Llama.libraryPath = "bin/MAC_ARM64/libllama.dylib";
     String modelPath = "/Users/adel/Workspace/gguf/gemma-3-4b-it-q4_0.gguf";
 
-    final modelParams = ModelParams()..nGpuLayers = -1;
-    final contextParams = ContextParams()..nCtx = 2048;
-    final samplerParams = SamplerParams();
-
-    final llama =
-        Llama(modelPath, modelParams, contextParams, samplerParams, false);
-
-    // --- The Agent's Main Loop ---
-    while (true) {
-      stdout.write("\nAsk me something (or type 'exit'): ");
-      final userInput = stdin.readLineSync();
-
-      if (userInput == null || userInput.toLowerCase() == 'exit') {
-        break;
-      }
+    ChatHistory history = ChatHistory()
+      ..addMessage(role: Role.user, content: prompt)
+      ..addMessage(role: Role.assistant, content: "");
 
-      print("🧠 Thinking...");
+    final modelParams = ModelParams()..nGpuLayers = 99;
 
-      // 1. Build the prompt using ChatHistory (THE CORRECT WAY)
-      final history = ChatHistory()
-        ..addMessage(role: Role.user, content: buildSystemPrompt())
-        ..addMessage(role: Role.user, content: userInput)
-        ..addMessage(role: Role.assistant, content: '');
+    final contextParams = ContextParams()
+      ..nPredict = -1
+      ..nCtx = 8192
+      ..nBatch = 8192;
 
-      // 2. Set the prompt and get the response by streaming tokens (THE CORRECT WAY)
-      llama.setPrompt(history.exportFormat(ChatFormat.gemini,
-          leaveLastAssistantOpen: true));
+    final samplerParams = SamplerParams()
+      ..temp = 0.7
+      ..topK = 64
+      ..topP = 0.95
+      ..penaltyRepeat = 1.1;
 
-      final responseBuffer = StringBuffer();
-      while (true) {
-        final (token, done) = llama.getNext();
-        responseBuffer.write(token);
-        if (done) break;
-      }
-      final llmResponse = responseBuffer.toString().trim();
-
-      print("✅ LLM's Plan (raw response): $llmResponse");
-
-      // 3. The "Coordinator" (our code) reads the plan and executes it.
-      try {
-        final jsonRegex = RegExp(r'\[.*\]', dotAll: true);
-        final match = jsonRegex.firstMatch(llmResponse);
-
-        if (match == null) {
-          print(
-              "🤖 I couldn't decide on a tool to use. Here's my raw thought: $llmResponse");
-          continue;
-        }
-
-        final jsonString = match.group(0)!;
-        final List<dynamic> toolCalls = jsonDecode(jsonString);
-
-        if (toolCalls.isEmpty) {
-          print(
-              "🤖 I don't have a tool for that. Please ask me about the time or weather.");
-          continue;
-        }
-
-        // 4. Execute each tool in the plan
-        for (var call in toolCalls) {
-          final toolName = call['tool_name'];
-          final arguments = call['arguments'] as Map<String, dynamic>;
-          final tool = toolBox[toolName];
+    Llama llama =
+        Llama(modelPath, modelParams, contextParams, samplerParams, false);
 
-          if (tool != null) {
-            print("🛠️  Executing tool: $toolName with args: $arguments");
-            if (toolName == 'getWeather') {
-              final result = await getWeather(arguments['city']);
-              print("✔️  Result: $result");
-            } else if (toolName == 'getCurrentTime') {
-              final result = getCurrentTime();
-              print("✔️  Result: $result");
-            }
-          } else {
-            print("❌ Error: Tool '$toolName' not found in my toolbox.");
-          }
-        }
-      } catch (e) {
-        print("❌ Error processing the LLM's plan: $e");
-        print("   My plan was: $llmResponse");
-      }
+    llama.setPrompt(
+        history.exportFormat(ChatFormat.gemini, leaveLastAssistantOpen: true));
+    while (true) {
+      var (token, done) = llama.getNext();
+      stdout.write(token);
+      if (done) break;
     }
+    stdout.write("\n");
 
     llama.dispose();
-    print("Goodbye!");
   } catch (e) {
-    print("\nFatal Error: ${e.toString()}");
+    print("\nError: ${e.toString()}");
   }
 }
@@ -8,8 +8,9 @@ Future<void> main() async {
 
   final contextParams = ContextParams()
     ..nPredict = -1
-    ..nCtx = 8192
-    ..nBatch = 8192;
+    ..nCtx = 2048
+    ..nUbatch = 2048
+    ..nBatch = 2048;
 
   final samplerParams = SamplerParams()
     ..temp = 0.7
@@ -18,12 +19,13 @@ Future<void> main() async {
     ..penaltyRepeat = 1.1;
 
   final llama = Llama(
-      "/Users/adel/Downloads/gemma-3n-E2B-it-plantvillage-model-Q4_K_M.gguf",
+      // "/Users/adel/Downloads/gemma-3n-E2B-it-plantvillage-model.gguf",
+      "/Users/adel/Downloads/gemma-3-4B-it-plantvillage-model-Q4_K_M.gguf",
       modelParams,
       contextParams,
       samplerParams,
       true,
-      "/Users/adel/Downloads/gemma-3n-E2B-it-plantvillage -mmproj.gguf");
+      "/Users/adel/Downloads/gemma-3-4B-it-plantvillage-mmproj.gguf");
 
   final image =
       LlamaImage.fromFile(File("/Users/adel/Downloads/plantvillage-test.png"));