Spaces:
Running
Running
File size: 1,292 Bytes
341de97 1f125f1 52c67ef |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 |
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer
def get_values_per_byte(base: int):
values_per_byte = 1
tmp = 255 // base
while tmp > 0:
values_per_byte += 1
tmp = tmp // base
return values_per_byte
def bytes_to_base(m: bytes, base: int) -> list[int]:
values_per_byte = get_values_per_byte(base)
values = []
for b in m:
tmp = []
for i in range(values_per_byte):
tmp.append(b % base)
b = b // base
values.extend(tmp[::-1])
return values
def base_to_bytes(values: list[int], base: int) -> bytes:
values_per_byte = get_values_per_byte(base)
arr = bytearray()
i = 0
while i < len(values):
tmp = 0
for _ in range(values_per_byte):
tmp = tmp * base + values[i]
i += 1
if i >= len(values):
break
arr.append(tmp)
return bytes(arr)
def load_model(name: str, device: torch.device):
model = AutoModelForCausalLM.from_pretrained(name)
model.to(device)
model.eval()
tokenizer = AutoTokenizer.from_pretrained(name)
return model, tokenizer
def static_init(cls):
if getattr(cls, "__static_init__", None):
cls.__static_init__()
return cls
|