tinybiggames
/

dolphin-2.9.1-llama-3-8b-Q4_K_M-GGUF

Generated from Trainer

Model card Files Files and versions Community

tinybiggames committed on Jun 4

Commit

a86f565

•

1 Parent(s): 99a890b

Update README.md

Files changed (1) hide show

README.md +11 -11

README.md CHANGED Viewed

@@ -30,7 +30,7 @@ Refer to the [original model card](https://huggingface.co/cognitivecomputations/
 How to configure LMEngine:
 ```Delphi
-Config_Init(
  'C:/LLM/gguf', // path to model files
  -1             // number of GPU layer, -1 to use all available layers
 );
@@ -39,7 +39,7 @@ Config_Init(
 How to define model:
 ```Delphi
-Model_Define('dolphin-2.9.1-llama-3-8b.Q4_K_M.gguf',
   'dolphin-2.9.1-llama-3-8b.Q4_K_M', 8000,
   '<|im_start|>{role}\n{content}<|im_end|>\n',
   '<|im_start|>assistant');
@@ -48,8 +48,8 @@ Model_Define('dolphin-2.9.1-llama-3-8b.Q4_K_M.gguf',
 How to add a message:
 ```Delphi
-Message_Add(
-  ROLE_USER,    // role
  'What is AI?'  // content
 );
 ```
@@ -66,17 +66,17 @@ var
   LOutputTokens: Int32;
   LTotalTokens: Int32;
-if Inference_Run('dolphin-2.9.1-llama-3-8b.Q4_K_M', 1024) then
   begin
-    Inference_GetUsage(nil, @LTokenOutputSpeed, @LInputTokens, @LOutputTokens,
       @LTotalTokens);
-    Console_PrintLn('', FG_WHITE);
-    Console_PrintLn('Tokens :: Input: %d, Output: %d, Total: %d, Speed: %3.1f t/s',
-      FG_BRIGHTYELLOW, LInputTokens, LOutputTokens, LTotalTokens, LTokenOutputSpeed);
   end
 else
   begin
-    Console_PrintLn('', FG_WHITE);
-    Console_PrintLn('Error: %s', FG_RED, Error_Get());
   end;
 ```

 How to configure LMEngine:
 ```Delphi
+LME_InitConfig(
  'C:/LLM/gguf', // path to model files
  -1             // number of GPU layer, -1 to use all available layers
 );
 How to define model:
 ```Delphi
+LME_DefineModel('dolphin-2.9.1-llama-3-8b.Q4_K_M.gguf',
   'dolphin-2.9.1-llama-3-8b.Q4_K_M', 8000,
   '<|im_start|>{role}\n{content}<|im_end|>\n',
   '<|im_start|>assistant');
 How to add a message:
 ```Delphi
+LME_AddMessage(
+  LME_ROLE_USER,    // role
  'What is AI?'  // content
 );
 ```
   LOutputTokens: Int32;
   LTotalTokens: Int32;
+if LME_RunInference('dolphin-2.9.1-llama-3-8b.Q4_K_M', 1024) then
   begin
+    LME_GetInferenceStats(nil, @LTokenOutputSpeed, @LInputTokens, @LOutputTokens,
       @LTotalTokens);
+    LME_PrintLn('', LME_FG_WHITE);
+    LME_PrintLn('Tokens :: Input: %d, Output: %d, Total: %d, Speed: %3.1f t/s',
+      LME_FG_BRIGHTYELLOW, LInputTokens, LOutputTokens, LTotalTokens, LTokenOutputSpeed);
   end
 else
   begin
+    LME_PrintLn('', LME_FG_WHITE);
+    LME_PrintLn('Error: %s', LME_FG_RED, LME_GetError());
   end;
 ```