tinybiggames committed on
Commit
6ea9f80
1 Parent(s): f25c10f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +11 -11
README.md CHANGED
@@ -22,13 +22,13 @@ widget:
22
  # tinybiggames/Phi-3-mini-4k-instruct-Q4_K_M-GGUF
23
  This model was converted to GGUF format from [`microsoft/Phi-3-mini-4k-instruct`](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) using llama.cpp via ggml.ai's [GGUF-my-repo](https://huggingface.co/spaces/ggml-org/gguf-my-repo) space.
24
  Refer to the [original model card](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) for more details on the model.
25
- ## Use with tinyBigGAMES's [LMEngine Inference Library](https://github.com/tinyBigGAMES/LMEngine)
26
 
27
 
28
  How to configure LMEngine:
29
 
30
  ```Delphi
31
- LME_InitConfig(
32
  'C:/LLM/gguf', // path to model files
33
  -1 // number of GPU layers, -1 to use all available layers
34
  );
@@ -37,7 +37,7 @@ LME_InitConfig(
37
  How to define model:
38
 
39
  ```Delphi
40
- LME_DefineModel('phi-3-mini-4k-instruct.Q4_K_M.gguf',
41
  'phi-3-mini-4k-instruct.Q4_K_M', 4000,
42
  '<|{role}|>{content}<|end|>',
43
  '<|assistant|>');
@@ -46,7 +46,7 @@ LME_DefineModel('phi-3-mini-4k-instruct.Q4_K_M.gguf',
46
  How to add a message:
47
 
48
  ```Delphi
49
- LME_AddMessage(
50
  LME_ROLE_USER, // role
51
  'What is AI?' // content
52
  );
@@ -64,17 +64,17 @@ var
64
  LOutputTokens: Int32;
65
  LTotalTokens: Int32;
66
 
67
- if LME_RunInference('phi-3-mini-4k-instruct.Q4_K_M', 1024) then
68
  begin
69
- LME_GetInferenceStats(nil, @LTokenOutputSpeed, @LInputTokens, @LOutputTokens,
70
  @LTotalTokens);
71
- LME_PrintLn('', LME_FG_WHITE);
72
- LME_PrintLn('Tokens :: Input: %d, Output: %d, Total: %d, Speed: %3.1f t/s',
73
- LME_FG_BRIGHTYELLOW, LInputTokens, LOutputTokens, LTotalTokens, LTokenOutputSpeed);
74
  end
75
  else
76
  begin
77
- LME_PrintLn('', LME_FG_WHITE);
78
- LME_PrintLn('Error: %s', LME_FG_RED, LME_GetError());
79
  end;
80
  ```
 
22
  # tinybiggames/Phi-3-mini-4k-instruct-Q4_K_M-GGUF
23
  This model was converted to GGUF format from [`microsoft/Phi-3-mini-4k-instruct`](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) using llama.cpp via ggml.ai's [GGUF-my-repo](https://huggingface.co/spaces/ggml-org/gguf-my-repo) space.
24
  Refer to the [original model card](https://huggingface.co/microsoft/Phi-3-mini-4k-instruct) for more details on the model.
25
+ ## Use with tinyBigGAMES's [Inference](https://github.com/tinyBigGAMES) Libraries
26
 
27
 
28
  How to configure LMEngine:
29
 
30
  ```Delphi
31
+ InitConfig(
32
  'C:/LLM/gguf', // path to model files
33
  -1 // number of GPU layers, -1 to use all available layers
34
  );
 
37
  How to define model:
38
 
39
  ```Delphi
40
+ DefineModel('phi-3-mini-4k-instruct.Q4_K_M.gguf',
41
  'phi-3-mini-4k-instruct.Q4_K_M', 4000,
42
  '<|{role}|>{content}<|end|>',
43
  '<|assistant|>');
 
46
  How to add a message:
47
 
48
  ```Delphi
49
+ AddMessage(
50
  LME_ROLE_USER, // role
51
  'What is AI?' // content
52
  );
 
64
  LOutputTokens: Int32;
65
  LTotalTokens: Int32;
66
 
67
+ if RunInference('phi-3-mini-4k-instruct.Q4_K_M', 1024) then
68
  begin
69
+ GetInferenceStats(nil, @LTokenOutputSpeed, @LInputTokens, @LOutputTokens,
70
  @LTotalTokens);
71
+ PrintLn('', LME_FG_WHITE);
72
+ PrintLn('Tokens :: Input: %d, Output: %d, Total: %d, Speed: %3.1f t/s',
73
+ FG_BRIGHTYELLOW, LInputTokens, LOutputTokens, LTotalTokens, LTokenOutputSpeed);
74
  end
75
  else
76
  begin
77
+ PrintLn('', FG_WHITE);
78
+ PrintLn('Error: %s', FG_RED, LME_GetError());
79
  end;
80
  ```