Add more options (delete original model, make repo public) and improve the generated README

Browse files

Files changed (4) hide show

auto-exl2-upload/auto-exl2-upload.zip +2 -2
auto-exl2-upload/exl2-quant.py +25 -6
exl2-multi-quant-local/exl2-multi-quant-local.zip +2 -2
exl2-multi-quant-local/exl2-quant.py +14 -0

auto-exl2-upload/auto-exl2-upload.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2672625552f8b5f8b32ba04ceac8e2c69a12ed3503c725bfd5c8d0f0bf0c5796
-size 7226

 version https://git-lfs.github.com/spec/v1
+oid sha256:9a85786265019ae7cda5806405f298f0803359920201db5dffb0958d55fbf76e
+size 7345

auto-exl2-upload/exl2-quant.py CHANGED Viewed

@@ -1,10 +1,11 @@
 #usually it's what is on the inside that counts, not this time. This script is a mess, but at least it works.
 #import required modules
-from huggingface_hub import login, get_token, whoami, repo_exists, file_exists, upload_folder, create_repo, upload_file, create_branch
 import os
 import sys
 import subprocess
 import glob
 #define os differences
 oname = os.name
@@ -142,12 +143,12 @@ if repo_exists(f"{whoami().get('name', None)}/{modelname}-exl2") == False:
     print("Writing model card...")
     with open('./README.md', 'w') as file:
         file.write(f"# Exl2 quants for [{modelname}](https://huggingface.co/{repo_url})\n\n")
-        file.write("## Automatically quantized using the auto quant from [hf-scripts](https://huggingface.co/anthonyg5005/hf-scripts)\n\n")
         file.write(f"Would recommend {whoami().get('name', None)} to change up this README to include more info.\n\n")
         file.write("### BPW:\n\n")
         for bpw in bpwvalue:
-            file.write(f"[{bpw}](https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2/tree/{bpw}bpw)\n\n")
-        file.write(f"\n\\\n[measurement.json](https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2/raw/main/measurement.json)\n\n")
     print("Created README.md")
     upload_file(path_or_fileobj="README.md", path_in_repo="README.md", repo_id=f"{whoami().get('name', None)}/{modelname}-exl2", commit_message="Add temp README") #upload md file
@@ -186,9 +187,25 @@ for bpw in bpwvalue:
 if file_exists(f"{whoami().get('name', None)}/{modelname}-exl2", "measurement.json") == False: #check if measurement.json exists in main
     upload_file(path_or_fileobj=f"measurements{slsh}{model}-measure{slsh}measurement.json", path_in_repo="measurement.json", repo_id=f"{whoami().get('name', None)}/{modelname}-exl2", commit_message="Add measurement.json") #upload measurement.json to main
-print(f'''Quants available at https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2
-      \nRepo is private, go to https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2/settings to make public if you'd like.''')
 if tfound == 'false':
     print(f'''
@@ -197,3 +214,5 @@ if tfound == 'false':
           To logout, use the hf command line interface 'huggingface-cli logout'
                To view your active account, use 'huggingface-cli whoami'
           ''')

 #usually it's what is on the inside that counts, not this time. This script is a mess, but at least it works.
 #import required modules
+from huggingface_hub import login, get_token, whoami, repo_exists, file_exists, upload_folder, create_repo, upload_file, create_branch, update_repo_visibility
 import os
 import sys
 import subprocess
 import glob
+import time
 #define os differences
 oname = os.name
     print("Writing model card...")
     with open('./README.md', 'w') as file:
         file.write(f"# Exl2 quants for [{modelname}](https://huggingface.co/{repo_url})\n\n")
+        file.write("## Automatically quantized using the auto quant script from [hf-scripts](https://huggingface.co/anthonyg5005/hf-scripts)\n\n")
         file.write(f"Would recommend {whoami().get('name', None)} to change up this README to include more info.\n\n")
         file.write("### BPW:\n\n")
         for bpw in bpwvalue:
+            file.write(f"[{bpw}](https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2/tree/{bpw}bpw)\\\n")
+        file.write(f"[measurement.json](https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2/resolve/main/measurement.json?download=true)\n")
     print("Created README.md")
     upload_file(path_or_fileobj="README.md", path_in_repo="README.md", repo_id=f"{whoami().get('name', None)}/{modelname}-exl2", commit_message="Add temp README") #upload md file
 if file_exists(f"{whoami().get('name', None)}/{modelname}-exl2", "measurement.json") == False: #check if measurement.json exists in main
     upload_file(path_or_fileobj=f"measurements{slsh}{model}-measure{slsh}measurement.json", path_in_repo="measurement.json", repo_id=f"{whoami().get('name', None)}/{modelname}-exl2", commit_message="Add measurement.json") #upload measurement.json to main
+clear_screen()
+delmodel = input("Do you want to delete the original model? (y/n): ")
+while delmodel != 'y' and delmodel != 'n':
+    delmodel = input("Please enter 'y' or 'n': ")
+if delmodel == 'y':
+    subprocess.run(f"{osrmd} models{slsh}{model}", shell=True)
+    print(f"Deleted models/{model}")
+    time.sleep(2)
+clear_screen()
+priv2pub = input("Do you want to make the repo public? (y/n): ")
+while priv2pub != 'y' and priv2pub != 'n':
+    priv2pub = input("Please enter 'y' or 'n': ")
+if priv2pub == 'y':
+    update_repo_visibility(f"{whoami().get('name', None)}/{modelname}-exl2", private=False)
+    print("Repo is now public.")
+    time.sleep(2)
+clear_screen()
 if tfound == 'false':
     print(f'''
           To logout, use the hf command line interface 'huggingface-cli logout'
                To view your active account, use 'huggingface-cli whoami'
           ''')
+print(f'''Quants available at https://huggingface.co/{whoami().get('name', None)}/{modelname}-exl2''')

exl2-multi-quant-local/exl2-multi-quant-local.zip CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ebc7c1e3b36a76ef3bfc3492caf0c2f76d16cb16e973ac717ef50a073db0d5f
-size 6249

 version https://git-lfs.github.com/spec/v1
+oid sha256:5d8efd32962bf1a775796bb5ae0500c56f2e2f5fc43335734926edd89db858a2
+size 6357

exl2-multi-quant-local/exl2-quant.py CHANGED Viewed

@@ -71,6 +71,14 @@ qmount = int(input("Enter the number of quants you want to create: "))
 qmount += 1
 clear_screen()
 #save bpw values
 print(f"Type the BPW for the following {qmount - 1} quants. Recommend staying over 2.4 BPW. Use the vram calculator to find the best BPW values: https://huggingface.co/spaces/NyxKrage/LLM-Model-VRAM-Calculator")
 qnum = {}
@@ -131,6 +139,12 @@ for bpw in bpwvalue:
         subprocess.run(f"{oscp} {model}-exl2-{bpw}bpw-WD{slsh}measurement.json measurements{slsh}{model}-measure", shell=True) #copy measurement to measure directory
         open(f"measurements{slsh}{model}-measure/Delete folder when no more quants are needed from this model", 'w').close()
     subprocess.run(f"{osrmd} {model}-exl2-{bpw}bpw-WD", shell=True) #remove working directory
 if tfound == 'false':
     print(f'''

 qmount += 1
 clear_screen()
+delmodel = input("Do you want to delete the original model after finishing? (Won't delete if canceled or failed) (y/n): ")
+while delmodel != 'y' and delmodel != 'n':
+    delmodel = input("Please enter 'y' or 'n': ")
+if delmodel == 'y':
+    print(f"Deleting dir models/{model} after quants are finished.")
+    time.sleep(3)
+clear_screen()
 #save bpw values
 print(f"Type the BPW for the following {qmount - 1} quants. Recommend staying over 2.4 BPW. Use the vram calculator to find the best BPW values: https://huggingface.co/spaces/NyxKrage/LLM-Model-VRAM-Calculator")
 qnum = {}
         subprocess.run(f"{oscp} {model}-exl2-{bpw}bpw-WD{slsh}measurement.json measurements{slsh}{model}-measure", shell=True) #copy measurement to measure directory
         open(f"measurements{slsh}{model}-measure/Delete folder when no more quants are needed from this model", 'w').close()
     subprocess.run(f"{osrmd} {model}-exl2-{bpw}bpw-WD", shell=True) #remove working directory
+if delmodel == 'y':
+    subprocess.run(f"{osrmd} models{slsh}{model}", shell=True)
+    print(f"Deleted models/{model}")
+    time.sleep(2)
+clear_screen()
 if tfound == 'false':
     print(f'''