{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "19fe0df6", "metadata": {}, "outputs": [], "source": [ "# !pip3 install https://github.com/casper-hansen/AutoAWQ/releases/download/v0.1.8/autoawq-0.1.8+cu118-cp310-cp310-linux_x86_64.whl" ] }, { "cell_type": "code", "execution_count": 2, "id": "47528ce3", "metadata": {}, "outputs": [], "source": [ "import os\n", "\n", "os.environ['CUDA_VISIBLE_DEVICES'] = '1'" ] }, { "cell_type": "code", "execution_count": 3, "id": "20861f3e", "metadata": {}, "outputs": [], "source": [ "from awq import AutoAWQForCausalLM\n", "from transformers import AutoConfig, AwqConfig, AutoTokenizer, AutoModelForCausalLM\n", "import torch\n", "\n", "model_path = 'mesolitica/malaysian-mistral-7b-32k-instructions-v4'" ] }, { "cell_type": "code", "execution_count": 4, "id": "9939ad4e", "metadata": { "scrolled": true }, "outputs": [ { "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "21aaf06156a0404fab259a4b45a92d6a", "version_major": 2, "version_minor": 0 }, "text/plain": [ "Loading checkpoint shards: 0%| | 0/3 [00:00