GGUF
Generated from Trainer
axolotl
llama-cpp
gguf-my-repo
LMEngine
tinybiggames committed on
Commit
65dfba0
1 Parent(s): a86f565

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +12 -12
README.md CHANGED
@@ -24,13 +24,13 @@ model-index:
24
  # tinybiggames/dolphin-2.9.1-llama-3-8b-Q4_K_M-GGUF
25
  This model was converted to GGUF format from [`cognitivecomputations/dolphin-2.9.1-llama-3-8b`](https://huggingface.co/cognitivecomputations/dolphin-2.9.1-llama-3-8b) using llama.cpp via ggml.ai's [GGUF-my-repo](https://huggingface.co/spaces/ggml-org/gguf-my-repo) space.
26
  Refer to the [original model card](https://huggingface.co/cognitivecomputations/dolphin-2.9.1-llama-3-8b) for more details on the model.
27
- ## Use with tinyBigGAMES's [LMEngine Inference Library](https://github.com/tinyBigGAMES/LMEngine)
28
 
29
 
30
  How to configure LMEngine:
31
 
32
  ```Delphi
33
- LME_InitConfig(
34
  'C:/LLM/gguf', // path to model files
35
  -1 // number of GPU layers, -1 to use all available layers
36
  );
@@ -39,7 +39,7 @@ LME_InitConfig(
39
  How to define model:
40
 
41
  ```Delphi
42
- LME_DefineModel('dolphin-2.9.1-llama-3-8b.Q4_K_M.gguf',
43
  'dolphin-2.9.1-llama-3-8b.Q4_K_M', 8000,
44
  '<|im_start|>{role}\n{content}<|im_end|>\n',
45
  '<|im_start|>assistant');
@@ -48,8 +48,8 @@ LME_DefineModel('dolphin-2.9.1-llama-3-8b.Q4_K_M.gguf',
48
  How to add a message:
49
 
50
  ```Delphi
51
- LME_AddMessage(
52
- LME_ROLE_USER, // role
53
  'What is AI?' // content
54
  );
55
  ```
@@ -66,17 +66,17 @@ var
66
  LOutputTokens: Int32;
67
  LTotalTokens: Int32;
68
 
69
- if LME_RunInference('dolphin-2.9.1-llama-3-8b.Q4_K_M', 1024) then
70
  begin
71
- LME_GetInferenceStats(nil, @LTokenOutputSpeed, @LInputTokens, @LOutputTokens,
72
  @LTotalTokens);
73
- LME_PrintLn('', LME_FG_WHITE);
74
- LME_PrintLn('Tokens :: Input: %d, Output: %d, Total: %d, Speed: %3.1f t/s',
75
- LME_FG_BRIGHTYELLOW, LInputTokens, LOutputTokens, LTotalTokens, LTokenOutputSpeed);
76
  end
77
  else
78
  begin
79
- LME_PrintLn('', LME_FG_WHITE);
80
- LME_PrintLn('Error: %s', LME_FG_RED, LME_GetError());
81
  end;
82
  ```
 
24
  # tinybiggames/dolphin-2.9.1-llama-3-8b-Q4_K_M-GGUF
25
  This model was converted to GGUF format from [`cognitivecomputations/dolphin-2.9.1-llama-3-8b`](https://huggingface.co/cognitivecomputations/dolphin-2.9.1-llama-3-8b) using llama.cpp via ggml.ai's [GGUF-my-repo](https://huggingface.co/spaces/ggml-org/gguf-my-repo) space.
26
  Refer to the [original model card](https://huggingface.co/cognitivecomputations/dolphin-2.9.1-llama-3-8b) for more details on the model.
27
+ ## Use with tinyBigGAMES's [Inference](https://github.com/tinyBigGAMES) Libraries.
28
 
29
 
30
  How to configure LMEngine:
31
 
32
  ```Delphi
33
+ InitConfig(
34
  'C:/LLM/gguf', // path to model files
35
  -1 // number of GPU layers, -1 to use all available layers
36
  );
 
39
  How to define model:
40
 
41
  ```Delphi
42
+ DefineModel('dolphin-2.9.1-llama-3-8b.Q4_K_M.gguf',
43
  'dolphin-2.9.1-llama-3-8b.Q4_K_M', 8000,
44
  '<|im_start|>{role}\n{content}<|im_end|>\n',
45
  '<|im_start|>assistant');
 
48
  How to add a message:
49
 
50
  ```Delphi
51
+ AddMessage(
52
+ ROLE_USER, // role
53
  'What is AI?' // content
54
  );
55
  ```
 
66
  LOutputTokens: Int32;
67
  LTotalTokens: Int32;
68
 
69
+ if RunInference('dolphin-2.9.1-llama-3-8b.Q4_K_M', 1024) then
70
  begin
71
+ GetInferenceStats(nil, @LTokenOutputSpeed, @LInputTokens, @LOutputTokens,
72
  @LTotalTokens);
73
+ PrintLn('', FG_WHITE);
74
+ PrintLn('Tokens :: Input: %d, Output: %d, Total: %d, Speed: %3.1f t/s',
75
+ FG_BRIGHTYELLOW, LInputTokens, LOutputTokens, LTotalTokens, LTokenOutputSpeed);
76
  end
77
  else
78
  begin
79
+ PrintLn('', FG_WHITE);
80
+ PrintLn('Error: %s', FG_RED, GetError());
81
  end;
82
  ```