Spaces:

yazan-istatiyeh
/

STAR-nasa-spaceappschallenge

Runtime error

App Files Files Community

yazan-istatiyeh committed on Oct 10, 2023

Commit

9b7711f

•

1 Parent(s): d65fc88

Added files and database

Browse files

Files changed (9) hide show

.gitattributes +2 -0
demo.py +116 -0
distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/data_level0.bin +3 -0
distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/header.bin +3 -0
distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/index_metadata.pickle +3 -0
distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/length.bin +3 -0
distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/link_lists.bin +3 -0
distilbert/chroma.sqlite3 +3 -0
requirements.txt +171 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa filter=lfs diff=lfs merge=lfs -text
+distilbert/chroma.sqlite3 filter=lfs diff=lfs merge=lfs -text

demo.py ADDED Viewed

	@@ -0,0 +1,116 @@

+import gradio as gr
+from dotenv import load_dotenv
+load_dotenv()
+# VectorIndexRetriever
+from llama_index.schema import NodeWithScore
+from llama_index import GPTVectorStoreIndex, ServiceContext
+from llama_index.storage import StorageContext
+from llama_index.vector_stores import ChromaVectorStore
+from llama_index.memory import ChatMemoryBuffer
+from llama_index.embeddings import HuggingFaceEmbedding
+import chromadb
+chroma_client = chromadb.PersistentClient(path="distilbert/")
+chroma_collection = chroma_client.get_or_create_collection("distilbert")
+vector_store = ChromaVectorStore(chroma_collection=chroma_collection)
+storage_context = StorageContext.from_defaults(vector_store=vector_store)
+embed_model = HuggingFaceEmbedding(model_name="distilbert-base-uncased")
+service_context = ServiceContext.from_defaults(embed_model=embed_model)
+index = GPTVectorStoreIndex.from_vector_store(
+    vector_store=vector_store,
+    storage_context=storage_context,
+    service_context=service_context
+)
+memory = ChatMemoryBuffer.from_defaults(token_limit=1000)
+chat_engine = index.as_chat_engine(
+    similarity_top_k=5,
+    chat_mode="context",
+    memory=memory,
+    system_prompt="You are an Artificial Intelligence (AI)-powered app called STAR " + \
+                  "(Standards Technical Assistance Resource) that could " + \
+                  "streamline the process and offer requirement " + \
+                  "recommendations, you can be used as copilot, to help " + \
+                  "mission designers blast off with even greater " + \
+                  "confidence, knowing that they have the right " + \
+                  "requirements in place. You should analyze and suggest " + \
+                  "improvements to a NASA standards."
+)
+query_engine = index.as_query_engine()
+retriever = index.as_retriever(
+    similarity_top_k=5,
+)
+THRESHOLD = 1e-9
+def inference(text, reset):
+    if text:
+        response = chat_engine.chat(text)
+        top_k_similar_nodes = retriever.retrieve(text)
+        to_view = []
+        for node in top_k_similar_nodes:
+            # print(node.get_score(), end = ' ')
+            if node.get_score() > THRESHOLD:
+                to_view.append((node.metadata()['file_name'], node.get_score()))
+            # to_view.append((node.metadata()['file_name'], node.get_score()))
+        references = ""
+        if len(to_view) > 0:
+            for i, t in enumerate(to_view):
+                filename, score = t
+                splits = filename.split('_')
+                page_number = int(splits[1])
+                original_document = ''.join(splits[3:])
+                references += f'{i + 1}- Document: ' + \
+                    f'{original_document[:-4]}, Page: ' + \
+                        f'{page_number} (Score: {score}).'
+                if i != len(to_view) - 1:
+                    references += '\n'
+        if reset:
+            memory.reset()
+        return response, references
+    elif reset:
+        memory.reset()
+    return "", ""
+examples = [
+    [
+        "How should the length-to-depth ratio of the initial flaw be " + \
+        "assumed when using the NASGRO® computer program for glass " + \
+        "structure analysis? Please provide a detailed procedure.",
+        True
+    ]
+]
+playground = gr.Interface(
+    fn=inference,
+    inputs=[
+        gr.Textbox(
+            value="Hello, who are you?",
+            label="Input",
+            info="Chat with STAR."
+        ),
+        gr.Checkbox(
+            label="Reset chat history",
+            info="Start a new conversation from scratch with STAR."
+        )
+    ],
+    outputs=[
+        gr.Textbox(
+            label="Response"
+        ),
+        gr.Textbox(
+            label="References"
+        )
+    ],
+    examples=examples,
+    cache_examples=True,
+    allow_flagging=False
+)
+playground.launch(share=True)

distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/data_level0.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23b875d0c9daae9e61adcd2c8db74630fd44f38b1409042455908fa07f718743
+size 51392000

distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/header.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:90716667250485db3ae5cbd6d6794aafe244b85861ca79a632d92813b6fb5407
+size 100

distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/index_metadata.pickle ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:811fdefc63959ca8c1c224917c80aad24cff9f5fa0d0c7f3c9b6a407d3885aa0
+size 926190

distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/length.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b405bbc082fd52d8bb9351d7bec3d3f98acdfe03d96b891786e59aa0b8cfd273
+size 64000

distilbert/88cf4ce2-b959-412a-9bef-3f16720e41fa/link_lists.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c7ab8525b2c907e225dedc7feb3d9e0dfdb2cedb417aa2f277ab219d6927e46
+size 136624

distilbert/chroma.sqlite3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7db200a30e658c17439694c9fcb339ac383b585b3eee4f939f510d2ac964247
+size 323895296

requirements.txt ADDED Viewed

	@@ -0,0 +1,171 @@

+absl-py==2.0.0
+aiofiles==23.2.1
+aiohttp==3.8.5
+aiosignal==1.3.1
+altair==5.1.2
+annotated-types==0.6.0
+anyio==3.7.1
+astunparse==1.6.3
+async-timeout==4.0.3
+attrs==23.1.0
+backoff==2.2.1
+bcrypt==4.0.1
+beautifulsoup4==4.12.2
+bs4==0.0.1
+cachetools==5.3.1
+certifi==2023.7.22
+charset-normalizer==3.3.0
+chroma-hnswlib==0.7.3
+chromadb==0.4.13
+click==8.1.7
+coloredlogs==15.0.1
+contourpy==1.1.1
+cycler==0.12.1
+dataclasses-json==0.6.1
+diskcache==5.6.3
+exceptiongroup==1.1.3
+fastapi==0.103.2
+ffmpy==0.3.1
+filelock==3.12.4
+flatbuffers==23.5.26
+fonttools==4.43.1
+frozenlist==1.4.0
+fsspec==2023.9.2
+gast==0.5.4
+google-auth==2.23.2
+google-auth-oauthlib==1.0.0
+google-pasta==0.2.0
+gradio==3.47.1
+gradio_client==0.6.0
+greenlet==3.0.0
+grpcio==1.59.0
+h11==0.14.0
+h5py==3.9.0
+httpcore==0.18.0
+httptools==0.6.0
+httpx==0.25.0
+huggingface-hub==0.17.3
+humanfriendly==10.0
+idna==3.4
+importlib-resources==6.1.0
+Jinja2==3.1.2
+joblib==1.3.2
+jsonpatch==1.33
+jsonpointer==2.4
+jsonschema==4.19.1
+jsonschema-specifications==2023.7.1
+keras==2.14.0
+kiwisolver==1.4.5
+langchain==0.0.310
+langsmith==0.0.43
+libclang==16.0.6
+llama-index==0.8.40
+llama_cpp_python==0.2.11
+Markdown==3.5
+MarkupSafe==2.1.3
+marshmallow==3.20.1
+matplotlib==3.8.0
+ml-dtypes==0.2.0
+monotonic==1.6
+mpmath==1.3.0
+multidict==6.0.4
+mypy-extensions==1.0.0
+nest-asyncio==1.5.8
+networkx==3.1
+nltk==3.8.1
+numpy==1.26.0
+nvidia-cublas-cu11==11.11.3.6
+nvidia-cublas-cu12==12.1.3.1
+nvidia-cuda-cupti-cu11==11.8.87
+nvidia-cuda-cupti-cu12==12.1.105
+nvidia-cuda-nvcc-cu11==11.8.89
+nvidia-cuda-nvrtc-cu12==12.1.105
+nvidia-cuda-runtime-cu11==11.8.89
+nvidia-cuda-runtime-cu12==12.1.105
+nvidia-cudnn-cu11==8.7.0.84
+nvidia-cudnn-cu12==8.9.2.26
+nvidia-cufft-cu11==10.9.0.58
+nvidia-cufft-cu12==11.0.2.54
+nvidia-curand-cu11==10.3.0.86
+nvidia-curand-cu12==10.3.2.106
+nvidia-cusolver-cu11==11.4.1.48
+nvidia-cusolver-cu12==11.4.5.107
+nvidia-cusparse-cu11==11.7.5.86
+nvidia-cusparse-cu12==12.1.0.106
+nvidia-nccl-cu11==2.16.5
+nvidia-nccl-cu12==2.18.1
+nvidia-nvjitlink-cu12==12.2.140
+nvidia-nvtx-cu12==12.1.105
+oauthlib==3.2.2
+onnxruntime==1.16.0
+openai==0.28.1
+opt-einsum==3.3.0
+orjson==3.9.7
+overrides==7.4.0
+packaging==23.2
+pandas==2.1.1
+Pillow==10.0.1
+posthog==3.0.2
+protobuf==4.24.4
+pulsar-client==3.3.0
+pyasn1==0.5.0
+pyasn1-modules==0.3.0
+pydantic==2.4.2
+pydantic_core==2.10.1
+pydub==0.25.1
+pyparsing==3.1.1
+pypdf==3.16.2
+PyPDF2==3.0.1
+PyPika==0.48.9
+python-dateutil==2.8.2
+python-dotenv==1.0.0
+python-multipart==0.0.6
+pytz==2023.3.post1
+PyYAML==6.0.1
+referencing==0.30.2
+regex==2023.10.3
+requests==2.31.0
+requests-oauthlib==1.3.1
+rpds-py==0.10.4
+rsa==4.9
+safetensors==0.4.0
+scikit-learn==1.3.1
+scipy==1.11.3
+semantic-version==2.10.0
+sentence-transformers==2.2.2
+sentencepiece==0.1.99
+six==1.16.0
+sniffio==1.3.0
+soupsieve==2.5
+SQLAlchemy==2.0.21
+starlette==0.27.0
+sympy==1.12
+tenacity==8.2.3
+tensorboard==2.14.1
+tensorboard-data-server==0.7.1
+tensorflow==2.14.0
+tensorflow-estimator==2.14.0
+tensorflow-io-gcs-filesystem==0.34.0
+tensorrt==8.5.3.1
+termcolor==2.3.0
+threadpoolctl==3.2.0
+tiktoken==0.5.1
+tokenizers==0.14.1
+toolz==0.12.0
+torch==2.1.0
+torchvision==0.16.0
+tqdm==4.66.1
+transformers==4.34.0
+triton==2.1.0
+typer==0.9.0
+typing-inspect==0.9.0
+typing_extensions==4.8.0
+tzdata==2023.3
+urllib3==1.26.17
+uvicorn==0.23.2
+uvloop==0.17.0
+watchfiles==0.20.0
+websockets==11.0.3
+Werkzeug==3.0.0
+wrapt==1.14.1
+yarl==1.9.2