Anthonyg5005 committed
Commit 92886bd
1 Parent(s): dc20c83

add vs 2019

Also remove the old windows quantizing scripts and add --upgrade just in case pip tries to falsely install from cache.
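For context on the --upgrade change, a minimal sketch of the failure mode it guards against (hypothetical session, not output captured from this repo): without the flag, pip stops as soon as any torch distribution is already present in the venv, even one built for a different compute backend.

$ venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/cu118
Requirement already satisfied: torch in ./venv/lib/python3.11/site-packages
$ venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/cu118 --upgrade
# --upgrade makes pip re-resolve torch against the cu118 index and replace a stale wheel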
- auto-exl2-upload/INSTRUCTIONS.txt +3 -2
- auto-exl2-upload/auto-exl2-upload.zip +2 -2
- auto-exl2-upload/linux-setup.sh +2 -2
- auto-exl2-upload/windows-setup.bat +2 -2
- exl2-multi-quant-local/INSTRUCTIONS.txt +3 -2
- exl2-multi-quant-local/exl2-multi-quant-local.zip +2 -2
- exl2-multi-quant-local/linux-setup.sh +2 -2
- exl2-multi-quant-local/windows-setup.bat +2 -2
- exl2-windows-local/convert-model-auto.bat +0 -9
- exl2-windows-local/download-model.bat +0 -5
- exl2-windows-local/download-model.py +0 -323
- exl2-windows-local/exl2-windows-local.zip +0 -3
- exl2-windows-local/instructions.txt +0 -21
- exl2-windows-local/windows-setup.bat +0 -58
auto-exl2-upload/INSTRUCTIONS.txt
CHANGED
@@ -8,8 +8,9 @@ https://developer.nvidia.com/cuda-11-8-0-download-archive
 
 Restart your computer after installing the CUDA toolkit to make sure the PATH is set correctly.
 
-Haven't done much testing but for Windows, Visual Studio with desktop development for C++ might be required.
-
+Haven't done much testing but for Windows, Visual Studio 2019 with desktop development for C++ might be required.
+https://visualstudio.microsoft.com/thank-you-downloading-visual-studio/?sku=community&rel=16&utm_medium=microsoft&utm_campaign=download+from+relnotes&utm_content=vs2019ga+button
+install the desktop development for C++ workload
 
 This may work with AMD cards but only on linux and possibly WSL2. I can't guarantee that it will work on AMD cards, I personally don't have one to test with. You may need to install stuff before starting. https://rocm.docs.amd.com/projects/install-on-linux/en/latest/tutorial/quick-start.html
 
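If you prefer to script the Visual Studio step, a hedged sketch using the VS bootstrapper's documented command-line flags (the workload ID Microsoft.VisualStudio.Workload.NativeDesktop corresponds to "Desktop development with C++"; the installer filename depends on your download):

vs_community.exe --add Microsoft.VisualStudio.Workload.NativeDesktop --includeRecommended --passive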
auto-exl2-upload/auto-exl2-upload.zip
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:2c2720bae3c941245912a72e95c2a4ad708e9118b1629a94ea473354705f045c
+size 7085
auto-exl2-upload/linux-setup.sh
CHANGED
@@ -27,13 +27,13 @@ read -p "Please enter your GPU compute version, CUDA 11/12 or AMD ROCm (11, 12,
 
 if [ "$pytorch_version" = "11" ]; then
   echo "Installing PyTorch for CUDA 11.8"
-  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/cu118
+  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/cu118 --upgrade
 elif [ "$pytorch_version" = "12" ]; then
   echo "Installing PyTorch for CUDA 12.1"
   venv/bin/python -m pip install torch
 elif [ "$pytorch_version" = "rocm" ]; then
   echo "Installing PyTorch for AMD ROCm 5.7"
-  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/rocm5.7
+  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/rocm5.7 --upgrade
 else
   echo "Invalid compute version. Please enter 11, 12, or rocm."
   read -p "Press enter to continue"
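A quick sanity check after either install branch (a sketch, not part of the script): wheels from the cu118 index carry a +cu118 local version suffix and ROCm wheels a +rocm suffix, so printing the version reveals whether the right backend landed.

venv/bin/python -c "import torch; print(torch.__version__, torch.version.cuda, torch.cuda.is_available())"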
auto-exl2-upload/windows-setup.bat
CHANGED
@@ -30,10 +30,10 @@ set /p cuda_version="Please enter your CUDA version (11 or 12): "
 
 if "%cuda_version%"=="11" (
     echo Installing PyTorch for CUDA 11.8...
-    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu118
+    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu118 --upgrade
 ) else if "%cuda_version%"=="12" (
     echo Installing PyTorch for CUDA 12.1...
-    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu121
+    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu121 --upgrade
 ) else (
     echo Invalid CUDA version. Please enter 11 or 12.
     pause
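The same backend check works in the Windows venv (sketch):

venv\scripts\python.exe -m pip show torch
venv\scripts\python.exe -c "import torch; print(torch.__version__, torch.version.cuda)"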
exl2-multi-quant-local/INSTRUCTIONS.txt
CHANGED
@@ -8,8 +8,9 @@ https://developer.nvidia.com/cuda-11-8-0-download-archive
 
 Restart your computer after installing the CUDA toolkit to make sure the PATH is set correctly.
 
-Haven't done much testing but for Windows, Visual Studio with desktop development for C++ might be required.
-
+Haven't done much testing but for Windows, Visual Studio 2019 with desktop development for C++ might be required.
+https://visualstudio.microsoft.com/thank-you-downloading-visual-studio/?sku=community&rel=16&utm_medium=microsoft&utm_campaign=download+from+relnotes&utm_content=vs2019ga+button
+install the desktop development for C++ workload
 
 This may work with AMD cards but only on linux and possibly WSL2. I can't guarantee that it will work on AMD cards, I personally don't have one to test with. You may need to install stuff before starting. https://rocm.docs.amd.com/projects/install-on-linux/en/latest/tutorial/quick-start.html
 
exl2-multi-quant-local/exl2-multi-quant-local.zip
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:9a6b8c97cdc430994bb2c5ee50104e4a6852b56b87d5cf1984aa6309a53cac17
+size 6103
exl2-multi-quant-local/linux-setup.sh
CHANGED
@@ -27,13 +27,13 @@ read -p "Please enter your GPU compute version, CUDA 11/12 or AMD ROCm (11, 12,
 
 if [ "$pytorch_version" = "11" ]; then
   echo "Installing PyTorch for CUDA 11.8"
-  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/cu118
+  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/cu118 --upgrade
 elif [ "$pytorch_version" = "12" ]; then
   echo "Installing PyTorch for CUDA 12.1"
   venv/bin/python -m pip install torch
 elif [ "$pytorch_version" = "rocm" ]; then
   echo "Installing PyTorch for AMD ROCm 5.7"
-  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/rocm5.7
+  venv/bin/python -m pip install torch --index-url https://download.pytorch.org/whl/rocm5.7 --upgrade
 else
   echo "Invalid compute version. Please enter 11, 12, or rocm."
   read -p "Press enter to continue"
exl2-multi-quant-local/windows-setup.bat
CHANGED
@@ -30,10 +30,10 @@ set /p cuda_version="Please enter your CUDA version (11 or 12): "
 
 if "%cuda_version%"=="11" (
     echo Installing PyTorch for CUDA 11.8...
-    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu118
+    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu118 --upgrade
 ) else if "%cuda_version%"=="12" (
     echo Installing PyTorch for CUDA 12.1...
-    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu121
+    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu121 --upgrade
 ) else (
     echo Invalid CUDA version. Please enter 11 or 12.
     pause
exl2-windows-local/convert-model-auto.bat
DELETED
@@ -1,9 +0,0 @@
-@echo off
-
-set /p "model=Folder name: "
-set /p "bpw=Target BPW: "
-mkdir %model%-exl2-%bpw%bpw
-mkdir %model%-exl2-%bpw%bpw-WD
-copy %model%\config.json %model%-exl2-%bpw%bpw-WD
-venv\scripts\python.exe convert.py -i %model% -o %model%-exl2-%bpw%bpw-WD -cf %model%-exl2-%bpw%bpw -b %bpw%
-rmdir /s /q %model%-exl2-%bpw%-WD
exl2-windows-local/download-model.bat
DELETED
@@ -1,5 +0,0 @@
-@echo off
-
-echo Enter the model repo. User/Repo:Branch (Branch optional)
-set /p "repo=Model repo: "
-venv\scripts\python.exe download-model.py %repo%
exl2-windows-local/download-model.py
DELETED
@@ -1,323 +0,0 @@
-'''
-Downloads models from Hugging Face to models/username_modelname.
-
-Example:
-python download-model.py facebook/opt-1.3b
-
-'''
-
-import argparse
-import base64
-import datetime
-import hashlib
-import json
-import os
-import re
-import sys
-from pathlib import Path
-
-import requests
-import tqdm
-from requests.adapters import HTTPAdapter
-from tqdm.contrib.concurrent import thread_map
-from huggingface_hub import get_token
-
-base = "https://huggingface.co"
-
-
-class ModelDownloader:
-    def __init__(self, max_retries=5):
-        self.max_retries = max_retries
-
-    def get_session(self):
-        session = requests.Session()
-        if self.max_retries:
-            session.mount('https://cdn-lfs.huggingface.co', HTTPAdapter(max_retries=self.max_retries))
-            session.mount('https://huggingface.co', HTTPAdapter(max_retries=self.max_retries))
-
-        if os.getenv('HF_USER') is not None and os.getenv('HF_PASS') is not None:
-            session.auth = (os.getenv('HF_USER'), os.getenv('HF_PASS'))
-
-        try:
-            from huggingface_hub import get_token
-            token = get_token()
-        except ImportError:
-            token = os.getenv("HF_TOKEN")
-
-        if token is not None:
-            session.headers = {'authorization': f'Bearer {token}'}
-
-        return session
-
-    def sanitize_model_and_branch_names(self, model, branch):
-        if model[-1] == '/':
-            model = model[:-1]
-
-        if model.startswith(base + '/'):
-            model = model[len(base) + 1:]
-
-        model_parts = model.split(":")
-        model = model_parts[0] if len(model_parts) > 0 else model
-        branch = model_parts[1] if len(model_parts) > 1 else branch
-
-        if branch is None:
-            branch = "main"
-        else:
-            pattern = re.compile(r"^[a-zA-Z0-9._-]+$")
-            if not pattern.match(branch):
-                raise ValueError(
-                    "Invalid branch name. Only alphanumeric characters, period, underscore and dash are allowed.")
-
-        return model, branch
-
-    def get_download_links_from_huggingface(self, model, branch, text_only=False, specific_file=None):
-        session = self.get_session()
-        page = f"/api/models/{model}/tree/{branch}"
-        cursor = b""
-
-        links = []
-        sha256 = []
-        classifications = []
-        has_pytorch = False
-        has_pt = False
-        has_gguf = False
-        has_safetensors = False
-        is_lora = False
-        while True:
-            url = f"{base}{page}" + (f"?cursor={cursor.decode()}" if cursor else "")
-            r = session.get(url, timeout=10)
-            r.raise_for_status()
-            content = r.content
-
-            dict = json.loads(content)
-            if len(dict) == 0:
-                break
-
-            for i in range(len(dict)):
-                fname = dict[i]['path']
-                if specific_file not in [None, ''] and fname != specific_file:
-                    continue
-
-                if not is_lora and fname.endswith(('adapter_config.json', 'adapter_model.bin')):
-                    is_lora = True
-
-                is_pytorch = re.match(r"(pytorch|adapter|gptq)_model.*\.bin", fname)
-                is_safetensors = re.match(r".*\.safetensors", fname)
-                is_pt = re.match(r".*\.pt", fname)
-                is_gguf = re.match(r'.*\.gguf', fname)
-                is_tiktoken = re.match(r".*\.tiktoken", fname)
-                is_tokenizer = re.match(r"(tokenizer|ice|spiece).*\.model", fname) or is_tiktoken
-                is_text = re.match(r".*\.(txt|json|py|md)", fname) or is_tokenizer
-                if any((is_pytorch, is_safetensors, is_pt, is_gguf, is_tokenizer, is_text)):
-                    if 'lfs' in dict[i]:
-                        sha256.append([fname, dict[i]['lfs']['oid']])
-
-                    if is_text:
-                        links.append(f"https://huggingface.co/{model}/resolve/{branch}/{fname}")
-                        classifications.append('text')
-                        continue
-
-                    if not text_only:
-                        links.append(f"https://huggingface.co/{model}/resolve/{branch}/{fname}")
-                        if is_safetensors:
-                            has_safetensors = True
-                            classifications.append('safetensors')
-                        elif is_pytorch:
-                            has_pytorch = True
-                            classifications.append('pytorch')
-                        elif is_pt:
-                            has_pt = True
-                            classifications.append('pt')
-                        elif is_gguf:
-                            has_gguf = True
-                            classifications.append('gguf')
-
-            cursor = base64.b64encode(f'{{"file_name":"{dict[-1]["path"]}"}}'.encode()) + b':50'
-            cursor = base64.b64encode(cursor)
-            cursor = cursor.replace(b'=', b'%3D')
-
-        # If both pytorch and safetensors are available, download safetensors only
-        if (has_pytorch or has_pt) and has_safetensors:
-            for i in range(len(classifications) - 1, -1, -1):
-                if classifications[i] in ['pytorch', 'pt']:
-                    links.pop(i)
-
-        # For GGUF, try to download only the Q4_K_M if no specific file is specified.
-        # If not present, exclude all GGUFs, as that's likely a repository with both
-        # GGUF and fp16 files.
-        if has_gguf and specific_file is None:
-            has_q4km = False
-            for i in range(len(classifications) - 1, -1, -1):
-                if 'q4_k_m' in links[i].lower():
-                    has_q4km = True
-
-            if has_q4km:
-                for i in range(len(classifications) - 1, -1, -1):
-                    if 'q4_k_m' not in links[i].lower():
-                        links.pop(i)
-            else:
-                for i in range(len(classifications) - 1, -1, -1):
-                    if links[i].lower().endswith('.gguf'):
-                        links.pop(i)
-
-        is_llamacpp = has_gguf and specific_file is not None
-        return links, sha256, is_lora, is_llamacpp
-
-    def get_output_folder(self, model, branch, is_lora, is_llamacpp=False):
-        base_folder = '.' if not is_lora else 'loras'
-
-        # If the model is of type GGUF, save directly in the base_folder
-        if is_llamacpp:
-            return Path(base_folder)
-
-        output_folder = f"{'_'.join(model.split('/')[-2:])}"
-        if branch != 'main':
-            output_folder += f'_{branch}'
-
-        output_folder = Path(base_folder) / output_folder
-        return output_folder
-
-    def get_single_file(self, url, output_folder, start_from_scratch=False):
-        session = self.get_session()
-        filename = Path(url.rsplit('/', 1)[1])
-        output_path = output_folder / filename
-        headers = {}
-        mode = 'wb'
-        if output_path.exists() and not start_from_scratch:
-
-            # Check if the file has already been downloaded completely
-            r = session.get(url, stream=True, timeout=10)
-            total_size = int(r.headers.get('content-length', 0))
-            if output_path.stat().st_size >= total_size:
-                return
-
-            # Otherwise, resume the download from where it left off
-            headers = {'Range': f'bytes={output_path.stat().st_size}-'}
-            mode = 'ab'
-
-        with session.get(url, stream=True, headers=headers, timeout=10) as r:
-            r.raise_for_status()  # Do not continue the download if the request was unsuccessful
-            total_size = int(r.headers.get('content-length', 0))
-            block_size = 1024 * 1024  # 1MB
-
-            tqdm_kwargs = {
-                'total': total_size,
-                'unit': 'iB',
-                'unit_scale': True,
-                'bar_format': '{l_bar}{bar}| {n_fmt:6}/{total_fmt:6} {rate_fmt:6}'
-            }
-
-            if 'COLAB_GPU' in os.environ:
-                tqdm_kwargs.update({
-                    'position': 0,
-                    'leave': True
-                })
-
-            with open(output_path, mode) as f:
-                with tqdm.tqdm(**tqdm_kwargs) as t:
-                    count = 0
-                    for data in r.iter_content(block_size):
-                        t.update(len(data))
-                        f.write(data)
-                        if total_size != 0 and self.progress_bar is not None:
-                            count += len(data)
-                            self.progress_bar(float(count) / float(total_size), f"{filename}")
-
-    def start_download_threads(self, file_list, output_folder, start_from_scratch=False, threads=4):
-        thread_map(lambda url: self.get_single_file(url, output_folder, start_from_scratch=start_from_scratch), file_list, max_workers=threads, disable=True)
-
-    def download_model_files(self, model, branch, links, sha256, output_folder, progress_bar=None, start_from_scratch=False, threads=4, specific_file=None, is_llamacpp=False):
-        self.progress_bar = progress_bar
-
-        # Create the folder and writing the metadata
-        output_folder.mkdir(parents=True, exist_ok=True)
-
-        if not is_llamacpp:
-            metadata = f'url: https://huggingface.co/{model}\n' \
-                       f'branch: {branch}\n' \
-                       f'download date: {datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S")}\n'
-
-            sha256_str = '\n'.join([f'    {item[1]} {item[0]}' for item in sha256])
-            if sha256_str:
-                metadata += f'sha256sum:\n{sha256_str}'
-
-            metadata += '\n'
-            (output_folder / 'huggingface-metadata.txt').write_text(metadata)
-
-        if specific_file:
-            print(f"Downloading {specific_file} to {output_folder}")
-        else:
-            print(f"Downloading the model to {output_folder}")
-
-        self.start_download_threads(links, output_folder, start_from_scratch=start_from_scratch, threads=threads)
-
-    def check_model_files(self, model, branch, links, sha256, output_folder):
-        # Validate the checksums
-        validated = True
-        for i in range(len(sha256)):
-            fpath = (output_folder / sha256[i][0])
-
-            if not fpath.exists():
-                print(f"The following file is missing: {fpath}")
-                validated = False
-                continue
-
-            with open(output_folder / sha256[i][0], "rb") as f:
-                file_hash = hashlib.file_digest(f, "sha256").hexdigest()
-                if file_hash != sha256[i][1]:
-                    print(f'Checksum failed: {sha256[i][0]}  {sha256[i][1]}')
-                    validated = False
-                else:
-                    print(f'Checksum validated: {sha256[i][0]}  {sha256[i][1]}')
-
-        if validated:
-            print('[+] Validated checksums of all model files!')
-        else:
-            print('[-] Invalid checksums. Rerun download-model.py with the --clean flag.')
-
-
-if __name__ == '__main__':
-
-    parser = argparse.ArgumentParser()
-    parser.add_argument('MODEL', type=str, default=None, nargs='?')
-    parser.add_argument('--branch', type=str, default='main', help='Name of the Git branch to download from.')
-    parser.add_argument('--threads', type=int, default=4, help='Number of files to download simultaneously.')
-    parser.add_argument('--text-only', action='store_true', help='Only download text files (txt/json).')
-    parser.add_argument('--specific-file', type=str, default=None, help='Name of the specific file to download (if not provided, downloads all).')
-    parser.add_argument('--output', type=str, default=None, help='The folder where the model should be saved.')
-    parser.add_argument('--clean', action='store_true', help='Does not resume the previous download.')
-    parser.add_argument('--check', action='store_true', help='Validates the checksums of model files.')
-    parser.add_argument('--max-retries', type=int, default=5, help='Max retries count when get error in download time.')
-    args = parser.parse_args()
-
-    branch = args.branch
-    model = args.MODEL
-    specific_file = args.specific_file
-
-    if model is None:
-        print("Error: Please specify the model you'd like to download (e.g. 'python download-model.py facebook/opt-1.3b').")
-        sys.exit()
-
-    downloader = ModelDownloader(max_retries=args.max_retries)
-    # Clean up the model/branch names
-    try:
-        model, branch = downloader.sanitize_model_and_branch_names(model, branch)
-    except ValueError as err_branch:
-        print(f"Error: {err_branch}")
-        sys.exit()
-
-    # Get the download links from Hugging Face
-    links, sha256, is_lora, is_llamacpp = downloader.get_download_links_from_huggingface(model, branch, text_only=args.text_only, specific_file=specific_file)
-
-    # Get the output folder
-    if args.output:
-        output_folder = Path(args.output)
-    else:
-        output_folder = downloader.get_output_folder(model, branch, is_lora, is_llamacpp=is_llamacpp)
-
-    if args.check:
-        # Check previously downloaded files
-        downloader.check_model_files(model, branch, links, sha256, output_folder)
-    else:
-        # Download files
-        downloader.download_model_files(model, branch, links, sha256, output_folder, specific_file=specific_file, threads=args.threads, is_llamacpp=is_llamacpp)
exl2-windows-local/exl2-windows-local.zip
DELETED
@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d1d305f32329e1c812ff858f6ca564c008ce02c0f1837c5f3560c62c7293d945
-size 5918
exl2-windows-local/instructions.txt
DELETED
@@ -1,21 +0,0 @@
-install the CUDA toolkit
-
-Nvidia Maxwell or higher
-https://developer.nvidia.com/cuda-downloads?target_os=Windows&target_arch=x86_64
-
-Nvidia Kepler or higher
-https://developer.nvidia.com/cuda-11-8-0-download-archive?target_os=Windows&target_arch=x86_64
-
-Haven't done much testing but Visual Studio with desktop development for C++ might be required. I've gotten cl.exe errors on a previous install
-
-make sure you setup the environment by using windows-setup.bat
-after everything is done just download a model using download-model.bat
-to quant, use convert-model-auto.bat. Enter the model's folder name, then the BPW for the model
-
-You can always pause the quantization process by pressing Ctrl + C and typing exit. All progress will be stored in the WD (working directory) folder. You can resume where you left off by running the convert-model-auto.bat script with the same arguments you used before.
-
-Credit to turboderp for creating exllamav2 and the exl2 quantization method.
-https://github.com/turboderp
-
-Credit to oobabooga the original download script.
-https://github.com/oobabooga
exl2-windows-local/windows-setup.bat
DELETED
@@ -1,58 +0,0 @@
-@echo off
-
-setlocal
-
-REM check if "venv" subdirectory exists, if not, create one
-if not exist "venv\" (
-    python -m venv venv
-) else (
-    echo venv directory already exists. If something is broken, delete everything but exl2-quant.py and run this script again.
-    pause
-    exit
-)
-
-REM ask if the user has git installed
-set /p gitinst="Do you have git installed? (y/n) "
-
-if "%gitinst%"=="y" (
-    echo Setting up environment
-) else (
-    echo Please install git before running this script.
-    pause
-    exit
-)
-
-REM if CUDA version 12 install pytorch for 12.1, else if CUDA 11 install pytorch for 11.8
-echo CUDA path: %CUDA_HOME%
-set /p cuda_version="Please enter your CUDA version (11 or 12): "
-
-if "%cuda_version%"=="11" (
-    echo Installing PyTorch for CUDA 11.8...
-    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu118 --upgrade
-) else if "%cuda_version%"=="12" (
-    echo Installing PyTorch for CUDA 12.1...
-    venv\scripts\python.exe -m pip install torch --index-url https://download.pytorch.org/whl/cu121 --upgrade
-) else (
-    echo Invalid CUDA version. Please enter 11 or 12.
-    pause
-    exit
-)
-
-REM download stuff
-echo Downloading files...
-git clone https://github.com/turboderp/exllamav2
-
-echo Installing pip packages...
-
-venv\scripts\python.exe -m pip install -r exllamav2/requirements.txt
-venv\scripts\python.exe -m pip install huggingface-hub
-venv\scripts\python.exe -m pip install .\exllamav2
-
-move download-model.bat exllamav2
-move convert-model-auto.bat exllamav2
-move download-model.py exllamav2
-move venv exllamav2
-
-powershell -c (New-Object Media.SoundPlayer "C:\Windows\Media\tada.wav").PlaySync();
-echo Environment setup complete. Read instructions.txt for further instructions.
-pause