From 223f2d9a0ba53820192f9d95850284f484fd6cf4 Mon Sep 17 00:00:00 2001
From: neutrino2211
Date: Mon, 22 Dec 2025 21:47:52 +0000
Subject: [PATCH] Add runpod/inflect.toml

---
Reviewer notes (ignored when the patch is applied):
  * Creates runpod/inflect.toml with a root-level `version`, a [package]
    metadata table, and [models], [knowledge_files] and [kernel] tables
    whose values are download URLs or runtime settings.
  * [systems.main] and [systems.mini] refer to entries of [models] and
    [knowledge_files] by key name, so those names must stay in sync.
  * The model key "qwen3-1.7b" is quoted because it contains a dot; an
    unquoted dot would be parsed as a nested-table path.
  * The hunk adds exactly 36 lines, matching the diffstat below and the
    `+1,36` hunk header.

 runpod/inflect.toml | 36 ++++++++++++++++++++++++++++++++++++
 1 file changed, 36 insertions(+)
 create mode 100644 runpod/inflect.toml

diff --git a/runpod/inflect.toml b/runpod/inflect.toml
new file mode 100644
index 0000000..dfb3e4c
--- /dev/null
+++ b/runpod/inflect.toml
@@ -0,0 +1,36 @@
+# Inflectfile
+
+version = 1
+
+[package]
+name = "runpod"
+version = "1.0.0"
+description = "A basic inflection system based on two research papers"
+license = "MIT"
+publisher = "QRK labs "
+maintainer = "QRK labs "
+contact = "contact@qrk.ng"
+published_at = "2025-09-23"
+
+[models]
+"qwen3-1.7b" = "https://huggingface.co/unsloth/Qwen3-1.7B-GGUF/resolve/main/Qwen3-1.7B-Q8_0.gguf?download=true"
+qwen3-4b = "https://huggingface.co/unsloth/Qwen3-4B-GGUF/resolve/main/Qwen3-4B-Q8_0.gguf?download=true"
+bge-m3 = "https://huggingface.co/gpustack/bge-m3-GGUF/resolve/main/bge-m3-FP16.gguf?download=true"
+
+[knowledge_files]
+papers = "https://git.mainasara.dev/qrk/knowledge/raw/branch/main/malik/all_insights.json"
+
+[kernel]
+file = "https://git.mainasara.dev/qrk/knowledge/raw/branch/main/kernel.js"
+runtime = "js"
+runtime_version = "1.0.0"
+
+[systems.main]
+language_model = "qwen3-4b"
+embedding_model = "bge-m3"
+knowledge_files = ["papers"]
+
+[systems.mini]
+language_model = "qwen3-1.7b"
+embedding_model = "bge-m3"
+knowledge_files = ["papers"]