mrm8488 committed on
Commit
8898865
1 Parent(s): 5249909

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +11 -10
README.md CHANGED
@@ -65,10 +65,14 @@ The following hyperparameters were used during training:
65
 
66
  ### Training results
67
 
68
- | Training Loss | Epoch | Step | Validation Loss |
69
- |:-------------:|:-----:|:----:|:---------------:|
70
- | 1.7917 | 0.72 | 5 | 1.7604 |
71
- | 1.7743 | 1.44 | 10 | 1.7217 |
 
 
 
 
72
 
73
 
74
  ### Usage
@@ -76,13 +80,10 @@ The following hyperparameters were used during training:
76
  import torch
77
  from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
78
 
79
- model_id = "mrm8488/limstral-7B-v0.1"
80
- tokenizer = "mrm8488/limstral-7B-v0.1"
81
-
82
- model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16)
83
- tokenizer = AutoTokenizer.from_pretrained(model_id)
84
 
85
- model.resize_token_embeddings(len(tokenizer))
 
86
 
87
  gen = pipeline("text-generation", model=model, tokenizer=tokenizer, device=0)
88
 
 
65
 
66
  ### Training results
67
 
68
+ | Step | Training Loss | Validation Loss |
69
+ |------|---------------|-----------------|
70
+ | 5 | 1.802800 | 1.848371 |
71
+ | 10 | 1.605800 | 1.803416 |
72
+ | 15 | 1.844800 | 1.762276 |
73
+ | 20 | 1.752600 | 1.754042 |
74
+ | 25 | 1.512400 | 1.750550 |
75
+
76
 
77
 
78
  ### Usage
 
80
  import torch
81
  from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
82
 
83
+ repo_id = "mrm8488/limstral-7B-v0.1"
 
 
 
 
84
 
85
+ model = AutoModelForCausalLM.from_pretrained(repo_id, torch_dtype=torch.bfloat16)
86
+ tokenizer = AutoTokenizer.from_pretrained(repo_id)
87
 
88
  gen = pipeline("text-generation", model=model, tokenizer=tokenizer, device=0)
89