diff options
| -rw-r--r-- | README.md | 4 | ||||
| -rw-r--r-- | context.txt | 9 | ||||
| -rw-r--r-- | models.h | 24 | ||||
| -rw-r--r-- | models.txt | 4 |
4 files changed, 40 insertions, 1 deletions
@@ -56,3 +56,7 @@ This builds a Docker image and drops you into a shell with the prompt binary and ```bash make clean ``` + +## Reading material + +- https://www.tinyllm.org/ diff --git a/context.txt b/context.txt new file mode 100644 index 0000000..12d3073 --- /dev/null +++ b/context.txt @@ -0,0 +1,9 @@ +Gandalf: wizard, Lord of the Rings, grey beard, staff, Istari, Grey Pilgrim, Mithrandir, fought Sauron, helped destroy One Ring. + +Frodo: hobbit, Lord of the Rings, Bilbo's nephew, Shire, carried One Ring to Mount Doom, Fellowship of the Ring. + +Example: Who is Gandalf? Gandalf is a wizard from The Lord of the Rings. +Example: Who is Frodo? Frodo is a hobbit from The Lord of the Rings. +Example: Who is Harry Potter? I don't have that information. + +Answer this question. Use only the facts from above. If unknown, say "I don't have that information." Just give the answer, no prefix: @@ -31,6 +31,30 @@ model_config models[] = { .min_p = 0.05f, .seed = LLAMA_DEFAULT_SEED, }, + { + .name = "phi-4-mini-instruct", + .filepath = "models/Phi-4-mini-instruct.Q2_K.gguf", + .n_gpu_layers = 0, + .use_mmap = false, + .n_ctx = 131072, + .n_batch = 4096, + .embeddings = false, + .temperature = 0.8f, + .min_p = 0.05f, + .seed = LLAMA_DEFAULT_SEED, + }, + { + .name = "tinyllama-1", + .filepath = "models/TinyLlama-1.1B-intermediate-step-1431k-3T-Q2_K.gguf", + .n_gpu_layers = 0, + .use_mmap = false, + .n_ctx = 2048, + .n_batch = 4096, + .embeddings = false, + .temperature = 0.8f, + .min_p = 0.05f, + .seed = LLAMA_DEFAULT_SEED, + }, }; const model_config *get_model_by_name(const char *name) { @@ -1 +1,3 @@ -https://huggingface.co/Felladrin/gguf-flan-t5-small/resolve/main/flan-t5-small.F16.gguf?download=true +https://huggingface.co/Felladrin/gguf-flan-t5-small/resolve/main/flan-t5-small.F16.gguf +https://huggingface.co/MaziyarPanahi/Phi-4-mini-instruct-GGUF/resolve/main/Phi-4-mini-instruct.Q2_K.gguf +https://huggingface.co/andrijdavid/TinyLlama-1.1B-intermediate-step-1431k-3T-GGUF/resolve/main/TinyLlama-1.1B-intermediate-step-1431k-3T-Q2_K.gguf |
