Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@ build
hs_err_pid*
replay_pid*

models/*.gguf
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This makes sure we don't accidentally check in a chonker .gguf file.

src/main/cpp/de_kherud_llama_*.h
src/main/resources/**/*.so
src/main/resources/**/*.dylib
Expand Down
5 changes: 3 additions & 2 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -25,11 +25,12 @@ There are multiple [examples](src/test/java/examples). Make sure to set `model.h
```bash
mvn exec:java -Dexec.mainClass="examples.MainExample" -Dmodel.home="/path/to/models" -Dmodel.name="codellama-13b.Q5_K_M.gguf"
```
Note: if your model is in the `models` directory, then you can omit the `-Dmodel.home` property.

You can also run some integration tests, which will automatically download a model to `model.home`:
You can also run some integration tests, which will automatically download a model to the `models` directory:

```bash
mvn verify -Dmodel.home=/path/to/models
mvn verify
```

### No Setup required
Expand Down
5 changes: 4 additions & 1 deletion build-args.cmake
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,9 @@ else()
set(LLAMA_METAL_DEFAULT OFF)
endif()

# general
option(LLAMA_NATIVE "llama: enable -march=native flag" ON)
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I'm genuinely not sure why this caused issues. If you have ideas or alternative approaches, do let me know.


# instruction set specific
if (LLAMA_NATIVE)
set(INS_ENB OFF)
Expand Down Expand Up @@ -633,4 +636,4 @@ if (CMAKE_SYSTEM_NAME MATCHES "NetBSD")
endif()
if (CMAKE_SYSTEM_NAME MATCHES "OpenBSD")
add_compile_definitions(_BSD_SOURCE)
endif()
endif()
3 changes: 3 additions & 0 deletions models/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
# Local Model Directory
This directory contains models which will be automatically downloaded
for use in java-llama.cpp's unit tests.
4 changes: 3 additions & 1 deletion pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -48,7 +48,8 @@
<junit.version>4.13.1</junit.version>
<test.plugin.version>3.2.3</test.plugin.version>
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
<integration.test.model>mistral-7b-instruct-v0.2.Q5_K_S.gguf</integration.test.model>
<model.home>${project.basedir}/models</model.home>
<integration.test.model>mistral-7b-instruct-v0.2.Q2_K.gguf</integration.test.model>
<integration.test.model.url>https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/${integration.test.model}</integration.test.model.url>
</properties>

Expand Down Expand Up @@ -110,6 +111,7 @@
<systemPropertyVariables>
<propertyName>model.home</propertyName>
<integration.test.model>${integration.test.model}</integration.test.model>
<model.home>${model.home}</model.home>
</systemPropertyVariables>
</configuration>
<executions>
Expand Down
6 changes: 4 additions & 2 deletions src/test/java/de/kherud/llama/LlamaModelIT.java
Original file line number Diff line number Diff line change
Expand Up @@ -86,7 +86,8 @@ public void testGenerateGrammar() {
String output = sb.toString();

Assert.assertTrue(output.matches("[ab]+"));
Assert.assertEquals(nPredict, model.encode(output).length);
int generated = model.encode(output).length;
Assert.assertTrue(generated > 0 && generated <= nPredict);
Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I suppose the number-of-tokens-to-generate parameter (`nPredict`) is an upper bound rather than a guarantee. The output is consistently off by 1 with the 2-bit quantization.

}

@Test
Expand Down Expand Up @@ -126,7 +127,8 @@ public void testCompleteGrammar() {
.setNPredict(nPredict);
String output = model.complete("", params);
Assert.assertTrue(output.matches("[ab]+"));
Assert.assertEquals(nPredict, model.encode(output).length);
int generated = model.encode(output).length;
Assert.assertTrue(generated > 0 && generated <= nPredict);
}

@Test
Expand Down
4 changes: 4 additions & 0 deletions src/test/java/de/kherud/llama/ModelResolver.java
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
package de.kherud.llama;

import java.io.File;
import java.nio.file.Paths;


Expand All @@ -22,6 +23,9 @@ public enum ModelResolver {
public String resolve() {
String ret = System.getProperty(systemPropertyName);
if(ret == null) {
if(new File("models").exists()) {
return "models";
}
throw new IllegalArgumentException(String.format(errorMessage, systemPropertyName));
}
return ret;
Expand Down