fsal committed on
Commit
c8ebe28
0 Parent(s):

first commit

Browse files
Files changed (42) hide show
  1. .dockerignore +14 -0
  2. .env-example +22 -0
  3. .github/ISSUE_TEMPLATE/bug_report.md +38 -0
  4. .github/ISSUE_TEMPLATE/feature_request.md +17 -0
  5. .github/dependabot.yml +15 -0
  6. .github/pull_request_template.md +13 -0
  7. .github/workflows/ai_changelog.yml +48 -0
  8. .github/workflows/bumpver.yml +40 -0
  9. .github/workflows/check-file-size-limit.yml +14 -0
  10. .github/workflows/docker-hub.yml +31 -0
  11. .github/workflows/hf-space.yml +24 -0
  12. .gitignore +90 -0
  13. .idea/.gitignore +8 -0
  14. .idea/.name +1 -0
  15. .idea/inspectionProfiles/Project_Default.xml +21 -0
  16. .idea/inspectionProfiles/profiles_settings.xml +6 -0
  17. .idea/kubernetes-settings.xml +6 -0
  18. .idea/langchain-streamlit-demo.iml +10 -0
  19. .idea/misc.xml +10 -0
  20. .idea/modules.xml +8 -0
  21. .pre-commit-config.yaml +61 -0
  22. AI_CHANGELOG.md +536 -0
  23. Dockerfile +19 -0
  24. LICENSE +9 -0
  25. README.md +112 -0
  26. bumpver.toml +18 -0
  27. docker-compose.yml +16 -0
  28. kubernetes/deploy.sh +19 -0
  29. kubernetes/resources.yaml +118 -0
  30. langchain-streamlit-demo/.streamlit/config.toml +6 -0
  31. langchain-streamlit-demo/app.py +627 -0
  32. langchain-streamlit-demo/defaults.py +134 -0
  33. langchain-streamlit-demo/llm_resources.py +294 -0
  34. langchain-streamlit-demo/python_coder.py +193 -0
  35. langchain-streamlit-demo/qagen.py +72 -0
  36. langchain-streamlit-demo/research_assistant/__init__.py +3 -0
  37. langchain-streamlit-demo/research_assistant/chain.py +18 -0
  38. langchain-streamlit-demo/research_assistant/search/__init__.py +0 -0
  39. langchain-streamlit-demo/research_assistant/search/web.py +178 -0
  40. langchain-streamlit-demo/research_assistant/writer.py +78 -0
  41. langchain-streamlit-demo/summarize.py +66 -0
  42. requirements.txt +23 -0
.dockerignore ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ .env
2
+ .env-example
3
+ .git/
4
+ .github
5
+ .gitignore
6
+ .idea
7
+ .mypy_cache
8
+ .pre-commit-config.yaml
9
+ .ruff_cache
10
+ Dockerfile
11
+ kubernetes
12
+ docker-compose.yml
13
+ junk/
14
+ kubernetes/
.env-example ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ APP_PORT=7860
2
+
3
+ LANGCHAIN_ENDPOINT="https://api.smith.langchain.com"
4
+ LANGCHAIN_API_KEY="ls__..."
5
+ LANGCHAIN_TRACING_V2="true"
6
+ LANGCHAIN_PROJECT="streamlit_test"
7
+
8
+ ANYSCALE_API_KEY="secret_..."
9
+ OPENAI_API_KEY="sk-..."
10
+ ANTHROPIC_API_KEY="sk-ant-..."
11
+
12
+ DEFAULT_SYSTEM_PROMPT="You are a helpful chatbot."
13
+
14
+ DEFAULT_MODEL="gpt-3.5-turbo"
15
+
16
+ DEFAULT_TEMPERATURE=0.7
17
+ MIN_TEMPERATURE=0.0
18
+ MAX_TEMPERATURE=1.0
19
+
20
+ DEFAULT_MAX_TOKENS=1000
21
+ MIN_MAX_TOKENS=1
22
+ MAX_MAX_TOKENS=100000
.github/ISSUE_TEMPLATE/bug_report.md ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ name: Bug report
3
+ about: Create a report to help us improve
4
+ title: ''
5
+ labels: bug
6
+ assignees: ''
7
+
8
+ ---
9
+
10
+ **Describe the bug**
11
+ A clear and concise description of what the bug is.
12
+
13
+ **To Reproduce**
14
+ Steps to reproduce the behavior:
15
+ 1. Go to '...'
16
+ 2. Click on '....'
17
+ 3. Scroll down to '....'
18
+ 4. See error
19
+
20
+ **Expected behavior**
21
+ A clear and concise description of what you expected to happen.
22
+
23
+ **Screenshots**
24
+ If applicable, add screenshots to help explain your problem.
25
+
26
+ **Desktop (please complete the following information):**
27
+ - OS: [e.g. iOS]
28
+ - Browser [e.g. chrome, safari]
29
+ - Version [e.g. 22]
30
+
31
+ **Smartphone (please complete the following information):**
32
+ - Device: [e.g. iPhone6]
33
+ - OS: [e.g. iOS8.1]
34
+ - Browser [e.g. stock browser, safari]
35
+ - Version [e.g. 22]
36
+
37
+ **Additional context**
38
+ Add any other context about the problem here.
.github/ISSUE_TEMPLATE/feature_request.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ name: Feature request
3
+ about: Suggest an idea for this project
4
+ title: ''
5
+ labels: enhancement
6
+ assignees: ''
7
+
8
+ ---
9
+
10
+ **Describe the solution you'd like**
11
+ A clear and concise description of what you want to happen.
12
+
13
+ **Describe alternatives you've considered**
14
+ A clear and concise description of any alternative solutions or features you've considered.
15
+
16
+ **Additional context**
17
+ Add any other context or screenshots about the feature request here.
.github/dependabot.yml ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # To get started with Dependabot version updates, you'll need to specify which
2
+ # package ecosystems to update and where the package manifests are located.
3
+ # Please see the documentation for all configuration options:
4
+ # https://docs.github.com/github/administering-a-repository/configuration-options-for-dependency-updates
5
+
6
+ version: 2
7
+ updates:
8
+ - package-ecosystem: "pip" # See documentation for possible values
9
+ directory: "/" # Location of package manifests
10
+ schedule:
11
+ interval: "weekly"
12
+ groups:
13
+ app:
14
+ patterns:
15
+ - "*"
.github/pull_request_template.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Thank you for contributing!
2
+ Before submitting this PR, please make sure:
3
+
4
+ - [ ] Your code builds clean without any errors or warnings
5
+ - [ ] Your code doesn't break anything we can't fix
6
+ - [ ] You have added appropriate tests
7
+
8
+ Please check one or more of the following to describe the nature of this PR:
9
+
10
+ - [ ] New feature
11
+ - [ ] Bug fix
12
+ - [ ] Documentation
13
+ - [ ] Other
.github/workflows/ai_changelog.yml ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Update AI Changelog on Push to Main
2
+
3
+ on:
4
+ push:
5
+ branches: [main]
6
+ paths-ignore:
7
+ - "AI_CHANGELOG.md"
8
+
9
+ jobs:
10
+ update-changelog:
11
+ runs-on: ubuntu-latest
12
+
13
+ permissions:
14
+ contents: write
15
+ pull-requests: write
16
+
17
+ steps:
18
+
19
+ - name: Checkout code
20
+ uses: actions/checkout@v4
21
+ with:
22
+ token: ${{ secrets.WORKFLOW_GIT_ACCESS_TOKEN }}
23
+ fetch-depth: 0
24
+
25
+ - name: Set up Python
26
+ uses: actions/setup-python@v4
27
+ with:
28
+ python-version: 3.11
29
+ cache: pip
30
+
31
+ - name: Install Python libraries
32
+ run: |
33
+ pip install --user ai_changelog==0.0.9
34
+
35
+ - name: Execute script and prepend to AI_CHANGELOG.md
36
+ env:
37
+ OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
38
+ LANGCHAIN_API_KEY: ${{ secrets.LANGCHAIN_API_KEY }}
39
+ LANGCHAIN_PROJECT: ai-changelog-langchain-streamlit-demo
40
+ LANGCHAIN_ENDPOINT: https://api.smith.langchain.com
41
+ LANGCHAIN_TRACING_V2: true
42
+ run: ai_changelog origin/main^..origin/main
43
+
44
+ - name: Commit changes
45
+ with:
46
+ COMMIT_MESSAGE: "Update AI Changelog"
47
+ file_pattern: "AI_CHANGELOG.md"
48
+ uses: stefanzweifel/git-auto-commit-action@v4
.github/workflows/bumpver.yml ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Bump Version
2
+
3
+ on:
4
+ workflow_dispatch:
5
+ inputs:
6
+ bump:
7
+ type: choice
8
+ description: 'Bump major, minor, or patch version'
9
+ required: true
10
+ default: 'patch'
11
+ options:
12
+ - 'major'
13
+ - 'minor'
14
+ - 'patch'
15
+
16
+ jobs:
17
+ bump-version:
18
+ runs-on: ubuntu-latest
19
+ permissions:
20
+ contents: write
21
+ steps:
22
+ - name: Checkout code
23
+ uses: actions/checkout@v4
24
+ with:
25
+ token: ${{ secrets.WORKFLOW_GIT_ACCESS_TOKEN }}
26
+ fetch-depth: 0
27
+ - name: Set up Python
28
+ uses: actions/setup-python@v4
29
+ with:
30
+ python-version: 3.11
31
+ cache: pip
32
+ - name: Install Python libraries
33
+ run: |
34
+ pip install --user bumpver
35
+ - name: git config
36
+ run: |
37
+ git config --local user.email "41898282+github-actions[bot]@users.noreply.github.com"
38
+ git config --local user.name "github-actions[bot]"
39
+ - name: Bump version
40
+ run: bumpver update --commit --tag-commit --${{ github.event.inputs.bump }} --push
.github/workflows/check-file-size-limit.yml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: 10 MB file size limit
2
+ on:
3
+ pull_request:
4
+ branches: [main]
5
+
6
+ jobs:
7
+ check-file-sizes:
8
+ runs-on: ubuntu-latest
9
+ steps:
10
+ - name: Check large files
11
+ uses: ActionsDesk/lfs-warning@v2.0
12
+ with:
13
+ filesizelimit: 10485760 # this is 10MB so we can sync to HF Spaces
14
+ token: ${{ secrets.WORKFLOW_GIT_ACCESS_TOKEN }}
.github/workflows/docker-hub.yml ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Push to Docker Hub
2
+
3
+ on:
4
+ push:
5
+ tags:
6
+ - '*.*.*'
7
+
8
+ jobs:
9
+ build-and-push-docker:
10
+ runs-on: ubuntu-latest
11
+ steps:
12
+ - uses: actions/checkout@v2
13
+ with:
14
+ fetch-depth: 0
15
+ token: ${{ secrets.WORKFLOW_GIT_ACCESS_TOKEN }}
16
+
17
+ - name: Log in to Docker Hub
18
+ uses: docker/login-action@v1
19
+ with:
20
+ username: joshuasundance
21
+ password: ${{ secrets.DOCKERHUB_TOKEN }}
22
+
23
+ - name: Build Docker image
24
+ run: |
25
+ docker build \
26
+ -t joshuasundance/langchain-streamlit-demo:${{ github.ref_name }} \
27
+ -t joshuasundance/langchain-streamlit-demo:latest \
28
+ .
29
+
30
+ - name: Push to Docker Hub
31
+ run: docker push -a joshuasundance/langchain-streamlit-demo
.github/workflows/hf-space.yml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Push to HuggingFace Space
2
+
3
+ on:
4
+ workflow_run:
5
+ workflows: ["Update AI Changelog on Push to Main"]
6
+ branches: [main]
7
+ types:
8
+ - completed
9
+ workflow_dispatch:
10
+
11
+ jobs:
12
+ push-to-huggingface:
13
+ runs-on: ubuntu-latest
14
+ steps:
15
+ - uses: actions/checkout@v2
16
+ with:
17
+ fetch-depth: 0
18
+ token: ${{ secrets.WORKFLOW_GIT_ACCESS_TOKEN }}
19
+
20
+ - name: Push to HuggingFace Space
21
+ env:
22
+ HF_TOKEN: ${{ secrets.HF_TOKEN }}
23
+ run: |
24
+ git push https://contentwise:$HF_TOKEN@huggingface.co/spaces/contentwise/langchain-streamlit-demo main
.gitignore ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *$py.class
2
+ *.chainlit
3
+ *.chroma
4
+ *.cover
5
+ *.egg
6
+ *.egg-info/
7
+ *.env
8
+ *.langchain.db
9
+ *.log
10
+ *.manifest
11
+ *.mo
12
+ *.pot
13
+ *.py,cover
14
+ *.py[cod]
15
+ *.sage.py
16
+ *.so
17
+ *.spec
18
+ .DS_STORE
19
+ .Python
20
+ .cache
21
+ .coverage
22
+ .coverage.*
23
+ .dmypy.json
24
+ .eggs/
25
+ .env
26
+ .hypothesis/
27
+ .installed.cfg
28
+ .ipynb_checkpoints
29
+ .mypy_cache/
30
+ .nox/
31
+ .pyre/
32
+ .pytest_cache/
33
+ .python-version
34
+ .ropeproject
35
+ .ruff_cache/
36
+ .scrapy
37
+ .spyderproject
38
+ .spyproject
39
+ .tox/
40
+ .venv
41
+ .vscode
42
+ .webassets-cache
43
+ /site
44
+ ENV/
45
+ MANIFEST
46
+ __pycache__
47
+ __pycache__/
48
+ __pypackages__/
49
+ build/
50
+ celerybeat-schedule
51
+ celerybeat.pid
52
+ coverage.xml
53
+ credentials.json
54
+ data/
55
+ db.sqlite3
56
+ db.sqlite3-journal
57
+ develop-eggs/
58
+ dist/
59
+ dmypy.json
60
+ docs/_build/
61
+ downloads/
62
+ eggs/
63
+ env.bak/
64
+ env/
65
+ fly.toml
66
+ htmlcov/
67
+ instance/
68
+ ipython_config.py
69
+ junk/
70
+ lib/
71
+ lib64/
72
+ local_settings.py
73
+ models/*.bin
74
+ nosetests.xml
75
+ notebooks/scratch/
76
+ parts/
77
+ pip-delete-this-directory.txt
78
+ pip-log.txt
79
+ pip-wheel-metadata/
80
+ profile_default/
81
+ sdist/
82
+ share/python-wheels/
83
+ storage
84
+ target/
85
+ token.json
86
+ var/
87
+ venv
88
+ venv.bak/
89
+ venv/
90
+ wheels/
.idea/.gitignore ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ # Default ignored files
2
+ /shelf/
3
+ /workspace.xml
4
+ # Editor-based HTTP Client requests
5
+ /httpRequests/
6
+ # Datasource local storage ignored files
7
+ /dataSources/
8
+ /dataSources.local.xml
.idea/.name ADDED
@@ -0,0 +1 @@
 
 
1
+ langchain-streamlit-demo
.idea/inspectionProfiles/Project_Default.xml ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <component name="InspectionProjectProfileManager">
2
+ <profile version="1.0">
3
+ <option name="myName" value="Project Default" />
4
+ <inspection_tool class="Eslint" enabled="true" level="WARNING" enabled_by_default="true" />
5
+ <inspection_tool class="InconsistentLineSeparators" enabled="true" level="WARNING" enabled_by_default="true" />
6
+ <inspection_tool class="PyCompatibilityInspection" enabled="true" level="WARNING" enabled_by_default="true">
7
+ <option name="ourVersions">
8
+ <value>
9
+ <list size="5">
10
+ <item index="0" class="java.lang.String" itemvalue="3.12" />
11
+ <item index="1" class="java.lang.String" itemvalue="3.8" />
12
+ <item index="2" class="java.lang.String" itemvalue="3.9" />
13
+ <item index="3" class="java.lang.String" itemvalue="3.10" />
14
+ <item index="4" class="java.lang.String" itemvalue="3.11" />
15
+ </list>
16
+ </value>
17
+ </option>
18
+ </inspection_tool>
19
+ <inspection_tool class="PyShadowingNamesInspection" enabled="false" level="WEAK WARNING" enabled_by_default="false" />
20
+ </profile>
21
+ </component>
.idea/inspectionProfiles/profiles_settings.xml ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ <component name="InspectionProjectProfileManager">
2
+ <settings>
3
+ <option name="USE_PROJECT_PROFILE" value="false" />
4
+ <version value="1.0" />
5
+ </settings>
6
+ </component>
.idea/kubernetes-settings.xml ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="KubernetesSettings">
4
+ <option name="contextName" value="swca-aks" />
5
+ </component>
6
+ </project>
.idea/langchain-streamlit-demo.iml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <module type="PYTHON_MODULE" version="4">
3
+ <component name="NewModuleRootManager">
4
+ <content url="file://$MODULE_DIR$">
5
+ <sourceFolder url="file://$MODULE_DIR$/langchain-streamlit-demo" isTestSource="false" />
6
+ </content>
7
+ <orderEntry type="jdk" jdkName="Remote Python 3.11.4 Docker (&lt;none&gt;:&lt;none&gt;) (5)" jdkType="Python SDK" />
8
+ <orderEntry type="sourceFolder" forTests="false" />
9
+ </component>
10
+ </module>
.idea/misc.xml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="Black">
4
+ <option name="sdkName" value="Remote Python 3.11.4 Docker (&lt;none&gt;:&lt;none&gt;) (5)" />
5
+ </component>
6
+ <component name="ProjectRootManager" version="2" project-jdk-name="Remote Python 3.11.4 Docker (&lt;none&gt;:&lt;none&gt;) (5)" project-jdk-type="Python SDK" />
7
+ <component name="PythonCompatibilityInspectionAdvertiser">
8
+ <option name="version" value="3" />
9
+ </component>
10
+ </project>
.idea/modules.xml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <project version="4">
3
+ <component name="ProjectModuleManager">
4
+ <modules>
5
+ <module fileurl="file://$PROJECT_DIR$/.idea/langchain-streamlit-demo.iml" filepath="$PROJECT_DIR$/.idea/langchain-streamlit-demo.iml" />
6
+ </modules>
7
+ </component>
8
+ </project>
.pre-commit-config.yaml ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Don't know what this file is? See https://pre-commit.com/
2
+ # pip install pre-commit
3
+ # pre-commit install
4
+ # pre-commit autoupdate
5
+ # Apply to all files without committing:
6
+ # pre-commit run --all-files
7
+ # I recommend running this until you pass all checks, and then commit.
8
+ # Fix what you need to and then let the pre-commit hooks resolve their conflicts.
9
+ # You may need to git add -u between runs.
10
+ exclude: "AI_CHANGELOG.md"
11
+ repos:
12
+ - repo: https://github.com/charliermarsh/ruff-pre-commit
13
+ rev: "v0.1.8"
14
+ hooks:
15
+ - id: ruff
16
+ args: [--fix, --exit-non-zero-on-fix, --ignore, E501]
17
+ - repo: https://github.com/koalaman/shellcheck-precommit
18
+ rev: v0.9.0
19
+ hooks:
20
+ - id: shellcheck
21
+ - repo: https://github.com/pre-commit/pre-commit-hooks
22
+ rev: v4.5.0
23
+ hooks:
24
+ - id: check-ast
25
+ - id: check-builtin-literals
26
+ - id: check-merge-conflict
27
+ - id: check-symlinks
28
+ - id: check-toml
29
+ - id: check-xml
30
+ - id: debug-statements
31
+ - id: check-case-conflict
32
+ - id: check-docstring-first
33
+ - id: check-executables-have-shebangs
34
+ - id: check-json
35
+ # - id: check-yaml
36
+ - id: debug-statements
37
+ - id: fix-byte-order-marker
38
+ - id: detect-private-key
39
+ - id: end-of-file-fixer
40
+ - id: trailing-whitespace
41
+ - id: mixed-line-ending
42
+ - id: requirements-txt-fixer
43
+ - repo: https://github.com/psf/black
44
+ rev: 23.12.0
45
+ hooks:
46
+ - id: black
47
+ - repo: https://github.com/asottile/add-trailing-comma
48
+ rev: v3.1.0
49
+ hooks:
50
+ - id: add-trailing-comma
51
+ - repo: https://github.com/pre-commit/mirrors-mypy
52
+ rev: v1.7.1
53
+ hooks:
54
+ - id: mypy
55
+ additional_dependencies:
56
+ - types-requests
57
+ - repo: https://github.com/PyCQA/bandit
58
+ rev: 1.7.6
59
+ hooks:
60
+ - id: bandit
61
+ args: ["-x", "tests/*.py", "-s", "B113"]
AI_CHANGELOG.md ADDED
@@ -0,0 +1,536 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # AI CHANGELOG
2
+ ## [Updated Python dependencies](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/511218395a883d498a66e4c136be25c110434b2a)
3
+ Mon Jan 29 12:14:25 2024 +0000
4
+ - The Python dependencies in the requirements.txt file have been updated. The following packages were upgraded: anthropic, black, duckduckgo-search, langchain, langsmith, numexpr, openai, and pypdf.
5
+ ## [Updated langchain package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/997c45707653d2b35465402714e289b56033f1e7)
6
+ Mon Jan 1 13:05:22 2024 +0000
7
+ - The langchain package version in the requirements.txt file has been updated from 0.0.352 to 0.0.353.
8
+ ## [Refactor and improve documentation for assistant tools](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/bd1f3d1c1d1c34d960051bdd37370ddba520b665)
9
+ Wed Dec 27 19:28:06 2023 -0500
10
+ - This commit includes several changes to improve the structure and documentation of the assistant tools used in the Streamlit app. The changes include:
11
+ - 1. Reordering of import statements for better readability and organization.
12
+ - 2. Refactoring of the research_assistant_tool, python_coder_tool, doc_chain_tool, and doc_question_tool functions to improve their documentation. The new documentation provides clearer instructions for use and sets more explicit expectations for the type of input these tools should receive.
13
+ - 3. Adjustments to the order of tools in the TOOLS list to ensure the doc_question_tool is prioritized.
14
+ ## [Updated application version to 2.1.4](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/13a5813ecd2f6bdfbc39bd2c50bdd36c43162733)
15
+ Wed Dec 27 16:25:25 2023 +0000
16
+ - The application version has been updated from 2.1.3 to 2.1.4 in multiple files: bumpver.toml, resources.yaml, and app.py. This change includes updating the current_version in bumpver.toml, the Docker image tag in the Kubernetes resources file, and the __version__ attribute in the app.py file.
17
+ ## [Updated chat input formatting in python_coder.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/39161d38df2e230a22fcc7b1eda31e486d989728)
18
+ Wed Dec 27 11:22:28 2023 -0500
19
+ - This commit changes the way user input is displayed in the chat history. Previously, a colon was prepended to user input. This has been removed to improve readability.
20
+ ## [Refactor Tool creation and usage in langchain-streamlit-demo](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f4b7ac3592a6b55c09bf3b2c7692467410d63687)
21
+ Wed Dec 27 11:21:00 2023 -0500
22
+ - This commit refactors the way tools are created and used within the langchain-streamlit-demo. The 'Tool' class has been replaced by a 'tool' decorator, making the code more Pythonic and easier to read.
23
+ - The 'research_assistant_tool', 'python_coder_tool', 'doc_chain_tool', and 'doc_question_tool' have all been updated to use this new decorator. This change also allows for the 'callbacks' parameter to be passed directly to the tool functions, improving flexibility.
24
+ - The 'description' attribute of each tool has been moved inside the function as a docstring, providing context about what each tool does in a more standard Python way.
25
+ ## [Changed default value of 'strict' parameter in check_mypy function](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/238a2a143b60d9ed340de283864a99f99bd0b0bc)
26
+ Wed Dec 27 10:54:14 2023 -0500
27
+ - The 'strict' parameter in the 'check_mypy' function has been modified. Previously, the default value was set to 'True'. This commit changes the default value to 'False'. This change affects how mypy checks are run on a file.
28
+ ## [Extended subprocess timeouts and added no-cache option to ruff commands](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f642d160e47dd94a51437ab57aa4757aabd013b6)
29
+ Wed Dec 27 10:53:23 2023 -0500
30
+ - Increased the timeout for subprocess commands from 3 seconds to 30 seconds to allow for longer processes. Added the '--no-cache' option to all 'ruff' commands to ensure that the most recent version of the file is being checked and formatted. Additionally, imported 'MessagesPlaceholder' from 'langchain.prompts' and added it to the 'ChatPromptTemplate' to include the chat history in the prompt.
31
+ ## [Added ConversationBufferMemory to agent](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/bc3a159a9e104625425de5578e0e060f12e6fe83)
32
+ Wed Dec 27 10:40:41 2023 -0500
33
+ - The ConversationBufferMemory was imported from the langchain.memory module and added to the agent. This change will enable the agent to store the conversation history, allowing it to respond more accurately to user inputs based on previous interactions.
34
+ ## [Bumped application version from 2.1.2 to 2.1.3](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/4c0a3bf81f9ddf898312804522c6b3f084bfa289)
35
+ Wed Dec 27 04:30:24 2023 +0000
36
+ - The 'current_version' field in 'bumpver.toml' was updated from 2.1.2 to 2.1.3, indicating a new version of the application.
37
+ - In 'kubernetes/resources.yaml', the image version for 'langchain-streamlit-demo' container was updated to match the new version.
38
+ - The '__version__' variable in 'app.py' under 'langchain-streamlit-demo' was also updated to reflect the new version.
39
+ ## [Added git configuration to GitHub Actions workflow](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/090173a3ba6868f868a9b707d657b4f180537c80)
40
+ Tue Dec 26 23:28:58 2023 -0500
41
+ - This commit introduces changes to the GitHub Actions workflow. Specifically, it adds a git configuration step to set the user email and name to 'github-actions[bot]'. This is important as it ensures that the bot is recognized as the author of any commits made during the workflow process.
42
+ ## [Added choice type to bump input in GitHub Actions workflow](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/414e3d472d9eda092b0fde7ee76d22fb033b837d)
43
+ Tue Dec 26 23:12:25 2023 -0500
44
+ - This commit modifies the 'bumpver.yml' file in our GitHub Actions workflow. Specifically, it adds a 'choice' type to the 'bump' input. This change ensures that the user can only select from predefined options when triggering the version bump workflow, thus minimizing the chance of errors.
45
+ ## [Added GitHub Actions Workflow for Version Bumping](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/6a47e1364d6f23b201ed7ae277698ada08793617)
46
+ Tue Dec 26 23:11:03 2023 -0500
47
+ - This commit introduces a new GitHub Actions workflow named 'Bump Version'.
48
+ - The workflow can be manually triggered and requires an input to specify whether to bump the major, minor, or patch version of the project.
49
+ - The job within the workflow runs on the latest Ubuntu, checks out the code, sets up Python 3.11, installs the 'bumpver' Python library, and then uses this library to bump the specified version.
50
+ - The updated version is then committed and tagged, and the changes are pushed back to the repository.
51
+ ## [Updated package versions in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/cd6528dd9a52049f0551411c148a7e7b0d3af0e9)
52
+ Mon Dec 25 12:11:03 2023 +0000
53
+ - This commit updates the versions of several packages in the requirements.txt file. The packages updated include: anthropic, black, duckduckgo-search, langchain, langsmith, mypy, openai, and pypdf. The purpose of these updates is to keep the project's dependencies up-to-date with the latest versions.
54
+ ## [Enabled config callbacks and updated tool descriptions](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/aa82c149b06608f987e7f8ff3882ed4fc53ed6e6)
55
+ Tue Dec 19 16:18:20 2023 -0600
56
+ - The commit enables the `get_config(callbacks)` within the `doc_chain_tool` and `doc_question_tool` functions. This allows the functions to use the specified config callbacks.
57
+ - It also updates the description of the `doc_question_tool` to clarify its usage and warn users not to send anything other than a question as it already has context.
58
+ ## [Updated versions of pre-commit hooks](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/7c729a3108c70efd5707ec4631d55e67f2968f8e)
59
+ Tue Dec 19 16:43:48 2023 -0500
60
+ - This commit updates the versions of multiple pre-commit hooks. The updated hooks include 'ruff-pre-commit' (from v0.0.291 to v0.1.8), 'pre-commit-hooks' (from v4.4.0 to v4.5.0), 'black' (from 23.9.1 to 23.12.0), 'mirrors-mypy' (from v1.5.1 to v1.7.1), and 'bandit' (from 1.7.5 to 1.7.6).
61
+ - These updates ensure that the project is using the most recent and secure versions of these tools, which can help to catch more potential issues during the pre-commit phase.
62
+ ## [Removed vcs.xml and updated default agent type in llm_resources.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/71e9279d36d4c78c6b18956c598445f6caf2ced6)
63
+ Tue Dec 19 16:10:18 2023 -0500
64
+ - The vcs.xml file, which was used for version control settings in the IDE, has been deleted. This indicates a change in the version control system or its configuration.
65
+ - In the llm_resources.py file, the default agent type for the get_doc_agent function has been changed from STRUCTURED_CHAT_ZERO_SHOT_REACT_DESCRIPTION to CHAT_ZERO_SHOT_REACT_DESCRIPTION. This suggests a change in how the agent responds in chat scenarios.
66
+ ## [Updated several package versions in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/1cf958abefb5cd3408fac7c64d96ecf6f3d62a28)
67
+ Tue Dec 19 18:26:07 2023 +0000
68
+ - The versions of the following packages were updated: anthropic (from 0.7.8 to 0.8.0), duckduckgo-search (from 4.0.0 to 4.1.0), langchain (from 0.0.350 to 0.0.351), and langsmith (from 0.0.71 to 0.0.72).
69
+ ## [Introduced document-agent and enhanced user-document-chat](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f88e711dc42403046604176f8eaa3ec716572cd7)
70
+ Tue Dec 19 12:12:02 2023 -0600
71
+ - This commit introduces the 'document-agent' tool which uses the 'doc_chain_agent' to return a response based on the user's custom context. It is recommended to use this tool when the user's question is complex, as it attempts to break it down into simpler questions.
72
+ - The 'user-document-chat' tool has been enhanced to return a response based on the user's custom context. It is advised to use this tool before conducting web research.
73
+ - A new function 'get_doc_agent' has been added in the 'llm_resources.py' file. This function initializes an agent with the given tools and a language model. The agent assists a chatbot with answering questions about a document. It breaks up incoming questions into multiple parts, and uses the tools provided to answer smaller questions before answering the larger question.
74
+ ## [Updated Dependabot configuration](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/4e2d2fd2be93bc022093064214e372833debd235)
75
+ Tue Dec 19 13:24:43 2023 -0500
76
+ - Added a new group 'app' in the Dependabot configuration file to include all dependencies ('*'). This will group updates for all dependencies together.
77
+ ## [Refactor Memory Management and Remove Intermediate Steps](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3a2b820bcfb7ef8dc4157626de454be9267e1e91)
78
+ Tue Dec 19 09:35:23 2023 -0500
79
+ - This commit refactors the memory management in the Streamlit app and other resources. It replaces the 'AgentTokenBufferMemory' with 'ConversationBufferMemory' for a more efficient memory usage. The 'return_messages' flag is set to 'True' in the new memory management system.
80
+ - The commit also disables the return of intermediate steps in both the Streamlit app and agent execution by setting 'return_intermediate_steps' to 'False'. This change can help to improve performance by reducing unnecessary computations.
81
+ - Furthermore, the commit simplifies the 'python_coder.py' script by removing unnecessary imports and argument parsing related to 'black', 'ruff', and 'mypy'. It also removes the main execution block, indicating that this script may now be used as a module rather than a standalone script.
82
+ - The changes in this commit aim to improve performance and maintainability of the code.
83
+ ## [Updated application version to 2.1.2](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3fddfc9d34f66f92255f6a0d0878e20db401d694)
84
+ Mon Dec 18 11:02:13 2023 -0500
85
+ - Bumped the current version of the application in the bumpver.toml file from 2.1.1 to 2.1.2.
86
+ - Updated the version of the Docker image used in the Kubernetes resources.yaml file from 2.1.1 to 2.1.2.
87
+ - Changed the __version__ variable in the app.py file of the langchain-streamlit-demo application from 2.1.1 to 2.1.2.
88
+ ## [Added PythonCompatibilityInspectionAdvertiser to misc.xml and updated agent_type in python_coder.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/04cf693d125a71f61b12ce8f5f8024c79fe9908c)
89
+ Mon Dec 18 10:59:56 2023 -0500
90
+ - In the misc.xml file, a new component 'PythonCompatibilityInspectionAdvertiser' was added to the project. This component is used for inspecting python compatibility.
91
+ - In the python_coder.py file, the default value for the 'agent_type' argument in the 'get_agent' function was changed from 'OPENAI_FUNCTIONS' to 'CHAT_CONVERSATIONAL_REACT_DESCRIPTION'. This change affects the type of agent that is initialized by default when the 'get_agent' function is called.
92
+ ## [Bumped version from 2.1.0 to 2.1.1](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/5a348f9029a30b49eda60ed7b6d612f9602c8bc8)
93
+ Mon Dec 18 10:41:42 2023 -0500
94
+ - The current version number in bumpver.toml, the image tag in kubernetes/resources.yaml, and the __version__ variable in langchain-streamlit-demo/app.py have all been updated from 2.1.0 to 2.1.1.
95
+ ## [Update PyPDF package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/fc63706a675b02d7b7db5bb31b81d14da3f17bed)
96
+ Mon Dec 18 13:16:53 2023 +0000
97
+ - This commit updates the version of the PyPDF package from 3.17.2 to 3.17.3 in the requirements.txt file.
98
+ ## [Updated langsmith package](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/688f2b15a1d6086d6c81ae06f27495421641ac20)
99
+ Mon Dec 18 13:15:37 2023 +0000
100
+ - The langsmith package has been updated from version 0.0.69 to 0.0.71 in the requirements.txt file.
101
+ ## [Updated anthropic package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d0fdfb5eaa95b1628140a0a1650d416220070fb4)
102
+ Mon Dec 18 13:15:24 2023 +0000
103
+ - The anthropic package in the requirements.txt file has been updated from version 0.7.7 to 0.7.8. No other packages were affected in this commit.
104
+ ## [Updated OpenAI library version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/4c03ff5ea6f5c3097a53e0c0c5db36967d5e1e8f)
105
+ Mon Dec 18 13:13:17 2023 +0000
106
+ - The OpenAI library version in requirements.txt has been updated from 1.3.8 to 1.5.0. This update may include new features, bug fixes, and performance improvements.
107
+ ## [Updated langchain version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/00528c803be2d7b84bedf1d5469d269529e8a3db)
108
+ Mon Dec 18 12:13:48 2023 +0000
109
+ - The langchain package was updated from version 0.0.348 to 0.0.350 in the requirements.txt file. This change was necessary to incorporate the latest features and bug fixes from the langchain package.
110
+ ## [Updated application version to 2.1.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/6a5206daa0170076d2e55f3878204571c03b0dbe)
111
+ Wed Dec 13 17:57:20 2023 -0500
112
+ - The version of the application has been updated from 2.0.1 to 2.1.0. This change is reflected in the bumpver.toml file, which tracks the current version of the application.
113
+ - In addition, the Docker image referenced in the Kubernetes resource configuration file (resources.yaml) has been updated to match the new version.
114
+ - Finally, the version number displayed on the application's Streamlit page (app.py) has also been updated to reflect the new version.
115
+ ## [Added Python Coder Assistant to Application Tools](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/94f9b82dcf0b254853e489743d140c674acb2bb6)
116
+ Wed Dec 13 17:54:48 2023 -0500
117
+ - In this commit, a Python Coder Assistant was added to the application's tools. This assistant is capable of writing Python code given clear instructions and requirements. It was implemented by importing the 'get_agent' function from the newly created 'python_coder.py' file and adding the resulting 'python_coder_tool' to the 'TOOLS' list.
118
+ - The 'python_coder.py' file contains the necessary functions and classes to initialize the Python Coder Assistant, check the code, and submit the code. It also ensures that the code conforms to the black, ruff, and strict mypy standards.
119
+ - The 'requirements.txt' file was updated to include the new dependencies required by the Python Coder Assistant, namely 'black', 'mypy', and 'ruff'.
120
+ ## [Added certifi and requests packages to requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/920ffd4c80beac16450c762c3caab609ede20fd0)
121
+ Wed Dec 13 18:16:18 2023 +0000
122
+ - The certifi and requests packages were added to the requirements.txt file to avoid potential vulnerabilities. These packages were not directly required, but were pinned by Snyk for security reasons.
123
+ ## [Enhanced tool descriptions and added 'llm-math' tool](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/13d332463cb60b873e75f45f783ca23cef55de93)
124
+ Wed Dec 13 13:09:22 2023 -0500
125
+ - The commit enhances the descriptions of the 'web-research-assistant' and 'user-document-chat' tools. It also adds the 'llm-math' tool to the default tools list in the 'app.py' file of the 'langchain-streamlit-demo' project.
126
+ - In the 'requirements.txt' file, the 'numexpr' package (version 2.8.8) has been added.
127
+ ## [Added tool loading functionality and updated assistant description](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d8714b091e4b40041ac26cd8a2854e5ef34011cb)
128
+ Wed Dec 13 10:35:50 2023 -0500
129
+ - In this commit, the developer has added a line to load additional tools using the 'load_tools' function from the 'langchain.agents' module. This extends the functionality of the default tools available in the application.
130
+ - Additionally, the developer has updated the description of the 'web-research-assistant' tool to provide more context on its usage and cost implications. The updated description advises users to use the assistant sparingly due to its relative expense and suggests using DuckDuckGo for quick facts instead.
131
+ ## [Bumped version from 2.0.0 to 2.0.1](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/9e698f4a274c4780d013fdfb0110a1f7675b580e)
132
+ Wed Dec 13 14:10:39 2023 +0000
133
+ - This commit updates the version number across several files. Specifically, it modifies the current version in bumpver.toml, the image version in the Kubernetes resources.yaml, and the __version__ variable in the langchain-streamlit-demo/app.py. All these changes reflect the version bump from 2.0.0 to 2.0.1.
134
+ ## [Improved chat message display in Streamlit app](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f15299ef4c3f6d17e1fed55329d9be2683e3e6de)
135
+ Wed Dec 13 09:08:41 2023 -0500
136
+ - This commit updates the chat history section of the Streamlit app. It adds a check to ensure that a message is only displayed if it has content and is of a recognized type ('ai', 'assistant', 'human', 'user'). This prevents empty or unhandled message types from being displayed, improving the user experience.
137
+ ## [Update version to 2.0.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/870f9c796ca452f131df63efeb5fd22f41b35cb3)
138
+ Tue Dec 12 17:23:25 2023 -0500
139
+ - The version number in bumpver.toml, kubernetes resources.yaml, and app.py has been updated from 1.1.0 to 2.0.0. This includes updates to the current version in the bumpver configuration, the docker image version in the Kubernetes resources file, and the application version in the app.py file.
140
+ ## [Added new search tools and updated assistant descriptions](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/1ea3b530f16118973e99729685e5e0be621e8a91)
141
+ Tue Dec 12 17:03:20 2023 -0500
142
+ - Added DuckDuckGoSearchRun and WikipediaQueryRun to the default tools. Updated the description of 'web-research-assistant' to mention quick facts usage of DuckDuckGo. Also, added these tools to the TOOLS list in the provider's condition.
143
+ - Updated the DEFAULT_SYSTEM_PROMPT in defaults.py to emphasize a step-by-step approach.
144
+ - Added 'wikipedia==1.4.0' to the requirements.txt file for using the Wikipedia API.
145
+ ## [Updated pre-commit hooks and refactored Streamlit app](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/5825ff944afc97081a1cc740d0ccf3095a80d697)
146
+ Tue Dec 12 16:03:57 2023 -0500
147
+ - 1. Updated the pre-commit configuration file to reorder the hooks, swapping the positions of the 'mypy' and 'black' hooks.
148
+ - 2. Refactored the Streamlit application 'app.py' by adding a new import statement and restructuring the code for better readability and performance. This includes changes in the way the 'research_assistant_tool' and 'doc_chain_tool' are defined and used, and the addition of the 'get_config' function for creating a configuration dictionary.
149
+ - 3. Updated the 'llm_resources.py' file to include 'callbacks' as an argument in the 'get_agent' function, and removed the 'create_retriever_tool' usage from the 'get_runnable' function.
150
+ ## [Added TODO comments for future development](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/547d578fa19e7542737e6165e21b93c0369f5f4f)
151
+ Tue Dec 12 14:50:49 2023 -0500
152
+ - This commit includes TODO comments in the app.py file of the langchain-streamlit-demo. These comments outline future development tasks related to the usage of agents in the OpenAI or Azure OpenAI, the usage of runnable, and the addition of these to tools.
153
+ ## [Added web research assistant and updated dependencies](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/883f3bee29ccd1f670e48245d3ada8d1fd7fd3c9)
154
+ Tue Dec 12 14:48:04 2023 -0500
155
+ - Added a web research assistant that uses DuckDuckGo's search API to perform web searches and BeautifulSoup to scrape text from the resulting URLs. The assistant then generates a report based on the scraped information.
156
+ - Updated the pre-commit configuration to add a dependency on 'types-requests'.
157
+ - Refactored the 'get_runnable' function in 'llm_resources.py' to use the new 'get_agent' function, which creates an agent with a set of tools and a chat history.
158
+ - Updated 'app.py' to use the new web research assistant, and refactored the code to use the new 'get_agent' function.
159
+ - Updated the requirements file to include 'beautifulsoup4' and 'duckduckgo-search'.
160
+ ## [Enhanced chat functionality in the LLMChain](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/048798b27efb2d8dbe52648fdcf34176a608a296)
161
+ Tue Dec 12 14:01:20 2023 -0500
162
+ - This commit introduces an enhancement to the chat functionality in the LLMChain. It does so by incorporating the chat history into the get_runnable function. The commit also restructures the import statements in the llm_resources.py file and adds new imports necessary for the enhancement.
163
+ - The get_runnable function now takes an additional parameter 'chat_history'. It creates a retriever tool and an OpenAIFunctionsAgent with a prompt that includes system messages and the chat history. An AgentTokenBufferMemory is also initialized with the chat history.
164
+ - The agent and the tools are then executed using an AgentExecutor that returns the output of the conversation. This enhancement allows the chatbot to maintain a history of the conversation and use it to provide more context-aware responses.
165
+ ## [Updated version from 1.0.3 to 1.1.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f9ace4d1dc84d8acfab5d95c489b461362d680d0)
166
+ Mon Dec 11 12:36:57 2023 -0500
167
+ - The version number in bumpver.toml, kubernetes/resources.yaml, and langchain-streamlit-demo/app.py has been updated from 1.0.3 to 1.1.0.
168
+ - In bumpver.toml, the current_version key's value is updated.
169
+ - In kubernetes/resources.yaml, the image version of the langchain-streamlit-demo container is updated.
170
+ - In langchain-streamlit-demo/app.py, the __version__ variable is updated.
171
+ ## [Removed BM25Retriever and related dependencies](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/c132355839f407ff11494aeee4ff361a7646e913)
172
+ Mon Dec 11 12:31:16 2023 -0500
173
+ - In this commit, the use of the BM25Retriever and its related dependencies were removed from the project. This included changes in the 'app.py' and 'llm_resources.py' files where the retriever was being used. The 'get_texts_and_retriever' function was removed from 'llm_resources.py' as it was no longer needed. Additionally, the 'rank_bm25' library was removed from the project's requirements in the 'requirements.txt' file.
174
+ ## [Updated retriever function and imports in app.py and llm_resources.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/e8b1107dfef3f5b1bb104b9e4d1f98095a2228ff)
175
+ Mon Dec 11 10:27:19 2023 -0600
176
+ - In the app.py file, the import statement was updated to include the 'get_texts_and_multiretriever' function from the 'llm_resources' module. The function 'get_texts_and_retriever_cacheable_wrapper' was also updated to call 'get_texts_and_multiretriever' instead of 'get_texts_and_retriever'.
177
+ - In the llm_resources.py file, the function 'get_texts_and_retriever2' was renamed to 'get_texts_and_multiretriever'.
178
+ ## [Updated OpenAI package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/cc740341e378b46896457ff83048b981ff8eadc2)
179
+ Mon Dec 11 12:44:43 2023 +0000
180
+ - The OpenAI package version in requirements.txt was updated from 1.3.7 to 1.3.8.
181
+ ## [Updated pypdf version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d880411e5d768b13efb25d3d7ac4ead6755a4ff0)
182
+ Mon Dec 11 12:44:36 2023 +0000
183
+ - The pypdf package version in requirements.txt was updated from 3.17.1 to 3.17.2. This change doesn't affect any other dependencies.
184
+ ## [Updated langchain version in requirements](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f23ab029e9e13452f9fe0e41ed48f36f257cdbfb)
185
+ Mon Dec 11 12:44:32 2023 +0000
186
+ - The version of langchain in the requirements.txt file was updated from 0.0.345 to 0.0.348. No other changes were made.
187
+ ## [Added new retriever function and updated langchain version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/09bee796cc0e56bf167cff0d12cbdb233184c376)
188
+ Fri Dec 8 15:20:41 2023 -0600
189
+ - In the langchain-streamlit-demo/llm_resources.py file, a new function called get_texts_and_retriever2 was added. This function processes uploaded file bytes and returns a list of documents and a BaseRetriever instance. It introduces new retriever classes MultiVectorRetriever and MultiQueryRetriever, and uses InMemoryStore for storage. Also, it generates unique identifiers for each text using the uuid library.
190
+ - In the requirements.txt file, the version of the langchain package was updated from 0.0.345 to 0.0.346.
191
+ ## [Updated Azure endpoint configuration in embeddings_kwargs](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/56dd4e0c90ab9ec09be58c184e6bf100398c9be8)
192
+ Thu Dec 7 11:00:31 2023 -0500
193
+ - This commit modifies the 'get_texts_and_retriever' function in the 'llm_resources.py' file.
194
+ - If 'use_azure' is True and 'azure_kwargs' is provided, the 'azure_endpoint' is now set with the value from 'openai_api_base'.
195
+ - This update ensures that the correct Azure endpoint is used when creating AzureOpenAIEmbeddings.
196
+ ## [Bumped version from 1.0.2 to 1.0.3](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/1c0c6c5c2e58321a2dd5f58c079c070d601e315c)
197
+ Thu Dec 7 10:25:07 2023 -0500
198
+ - Updated the version number in bumpver.toml, the Docker image version in the Kubernetes resources.yaml, and the application version in the app.py file of the langchain-streamlit-demo.
199
+ ## [Refactored variable name in AzureChatOpenAI constructor](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/17f45e34541f6182f43665bf6c0fe66b2a725eb8)
200
+ Thu Dec 7 10:21:30 2023 -0500
201
+ - Changed the variable name 'openai_api_base' to 'azure_endpoint' in the AzureChatOpenAI constructor for clarity and consistency.
202
+ ## [Update version from 1.0.1 to 1.0.2](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/8fee298d3553974031cad83e42e34b6559df5fe5)
203
+ Mon Dec 4 11:27:10 2023 -0500
204
+ - The version number has been updated in the following files: `bumpver.toml` (the project's version control file), `kubernetes/resources.yaml` (the Kubernetes resources configuration file), and `langchain-streamlit-demo/app.py` (the application's main Python file).
205
+ - In `bumpver.toml`, the `current_version` variable has been updated to `1.0.2`.
206
+ - In `kubernetes/resources.yaml`, the Docker image version has been updated to `1.0.2`.
207
+ - In `langchain-streamlit-demo/app.py`, the `__version__` variable has been updated to `1.0.2`.
208
+ ## [Updated package versions in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3d7adb3b01d4565d59e4b999c69e2d554fab9f02)
209
+ Mon Dec 4 11:11:37 2023 -0500
210
+ - This commit updates the versions of several packages in the requirements.txt file. The updated packages include 'langchain', 'langsmith', 'openai', 'streamlit', and 'tiktoken'.
211
+ - Such updates are necessary to keep the software up-to-date with the latest improvements, bug fixes, and security patches in the packages that it depends on.
212
+ ## [Updated version to 1.0.1](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d15b0d2767d9647dd0b05649e5c1d008fa56920e)
213
+ Thu Nov 30 15:19:39 2023 -0500
214
+ - The version number in bumpver.toml, the Docker image tag in kubernetes/resources.yaml and the version in langchain-streamlit-demo/app.py have been updated from 1.0.0 to 1.0.1.
215
+ ## [Refactored error handling and added support for AzureOpenAIEmbeddings](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/ead1471ab8d44f8e1ad885100ba614a8a589de5a)
216
+ Thu Nov 30 15:12:53 2023 -0500
217
+ - This commit includes two main changes. First, the error handling in 'app.py' was refactored to correct the namespace for 'openai.AuthenticationError'.
218
+ - Second, in 'llm_resources.py', the code was updated to include support for 'AzureOpenAIEmbeddings' in addition to the existing 'OpenAIEmbeddings'. This allows the application to use either OpenAI's standard embeddings or Azure's version, depending on the provided configuration.
219
+ ## [Upgraded project version from 0.3.0 to 1.0.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/a338494f3816bbb77360d2f43a515d1cc39cd760)
220
+ Wed Nov 29 16:05:50 2023 -0500
221
+ - Updated the current version in bumpver.toml from 0.3.0 to 1.0.0.
222
+ - Modified the Docker image version in kubernetes/resources.yaml from joshuasundance/langchain-streamlit-demo:0.3.0 to joshuasundance/langchain-streamlit-demo:1.0.0.
223
+ - Changed the __version__ variable in langchain-streamlit-demo/app.py from 0.3.0 to 1.0.0.
224
+ ## [Updated model list, library versions, and code formatting](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3ca1115e20d1709f4ede77b0ce63fafcf42a362c)
225
+ Wed Nov 29 16:01:38 2023 -0500
226
+ - 1. In the 'defaults.py' file, the list of models was updated. New models were added and existing model names were updated.
227
+ - 2. In the 'llm_resources.py' file, a minor code formatting change was made.
228
+ - 3. In the 'requirements.txt' file, the versions of several libraries were updated, including 'anthropic', 'langchain', 'langsmith', and 'openai'.
229
+ ## [Updated version from 0.2.0 to 0.3.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/2d1ba795654b4c65e705f42a92eae7a382cc8e66)
230
+ Mon Nov 27 16:46:11 2023 -0500
231
+ - The version number has been updated from 0.2.0 to 0.3.0 in multiple files. This includes the bumpver.toml, which controls the project versioning, the Kubernetes resources.yaml, which specifies the Docker image version to use, and the main app.py file, which includes a version number for display in the web app.
232
+ ## [Updated caching decorator and minor code formatting](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/5cdfa32bdb13c91564a4e175bafe1bc04414d1d8)
233
+ Mon Nov 27 14:47:58 2023 -0600
234
+ - Replaced the `@st.cache_data` decorator with `@st.cache_resource` in `app.py` for the `get_texts_and_retriever_cacheable_wrapper` function. This change might be due to an update in the library or to utilize a more suitable caching method.
235
+ - In `llm_resources.py`, removed an unnecessary line break and added a space for better code readability.
236
+ ## [Updated OpenAI library version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/a88ba2b3040ffff0c93d1c6159b6120091f76e37)
237
+ Mon Nov 27 12:36:16 2023 +0000
238
+ - The OpenAI library version in the project's requirements has been updated from 0.28.1 to 1.3.5. This update may include new features, bug fixes, or performance improvements from the library.
239
+ ## [Updated langsmith package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/b3a6aa254b2acd40593ef0b0167e061cd5beb448)
240
+ Mon Nov 27 12:36:12 2023 +0000
241
+ - The langsmith package version in requirements.txt was updated from 0.0.63 to 0.0.66.
242
+ ## [Updated langchain version in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d6340145557e4727e4521c530efa8abe16060882)
243
+ Mon Nov 27 12:36:07 2023 +0000
244
+ - The langchain package version has been updated from 0.0.334 to 0.0.340 in the requirements.txt file. This update may include new features, bug fixes, or performance improvements.
245
+ ## [Updated anthropic package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/264cec5ebc6b618397d3b9449bf5277c3ad53c96)
246
+ Mon Nov 27 12:36:01 2023 +0000
247
+ - The anthropic package version in requirements.txt was updated from 0.5.0 to 0.7.4. No other dependencies were changed.
248
+ ## [Updated pypdf version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/325c8315d4b388c71776a939a5267776940b26ce)
249
+ Mon Nov 20 12:35:08 2023 +0000
250
+ - The pypdf library was updated from version 3.17.0 to 3.17.1 in the requirements.txt file.
251
+ ## [Updated project version to 0.2.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/97d4687085a8c28a8c0a3a082e9cfa70d2fe853e)
252
+ Fri Nov 10 21:30:40 2023 -0500
253
+ - The version number in bumpver.toml has been updated from 0.1.2 to 0.2.0.
254
+ - In the Kubernetes resources.yaml file, the image version of langchain-streamlit-demo has been updated to reflect the new version.
255
+ - The __version__ variable in the app.py file of the langchain-streamlit-demo project has also been updated to 0.2.0.
256
+ ## [Updated pillow library version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f61858c54e1a37f8a7a734ca2c84c66cd62d77e4)
257
+ Sat Nov 11 02:07:34 2023 +0000
258
+ - The pillow library version was updated from 10.0.0 to 10.0.1 in the requirements.txt file. This change was made to avoid a vulnerability.
259
+ ## [Updated package versions in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d4691b420e22e6b27a3d968f1295d97bb3191376)
260
+ Fri Nov 10 21:04:08 2023 -0500
261
+ - Updated the versions of the 'langchain', 'langsmith', and 'streamlit' packages in the requirements.txt file.
262
+ - Added 'pillow' and 'pyarrow' packages to the requirements.txt file.
263
+ - These changes ensure that the project is using the latest and most secure versions of the dependencies.
264
+ ## [Bumped application version from 0.1.1 to 0.1.2](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/a51a26dd0cf4b33726ac3aa84b41acc103b0c06f)
265
+ Wed Nov 1 16:03:52 2023 -0400
266
+ - Updated the application version in bumpver.toml, resources.yaml, and app.py. This includes the version used for the Docker image in the Kubernetes deployment configuration.
267
+ ## [Updated default checkbox value and removed initial chatbot message](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3d59c85771f67f633f9498ffa3705880576de914)
268
+ Wed Nov 1 15:51:00 2023 -0400
269
+ - Changed the default value of the 'Document Chat' checkbox to be true if a file is uploaded and false if not.
270
+ - Removed the condition that disables the 'Chain Type' dropdown when 'Document Chat' is not selected.
271
+ - Eliminated the automatic 'Hello! I'm a helpful AI chatbot. Ask me a question!' message when the chat history is empty.
272
+ ## [Version Bump to 0.1.1](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/fc0e83182e47a9f41465fa815b286455b10e78f9)
273
+ Wed Nov 1 13:58:11 2023 -0400
274
+ - This commit represents a version bump from 0.1.0 to 0.1.1. Changes were made in the bumpver.toml file to update the current version. The Docker image reference in the Kubernetes resources.yaml file was also updated to reflect the new version. Lastly, the __version__ variable in the langchain-streamlit-demo/app.py file was updated.
275
+ ## [Handled additional exception in app.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/8a23b378977a263201791101e5a0ebc56e4f5f05)
276
+ Wed Nov 1 13:55:35 2023 -0400
277
+ - Updated the exception handling in app.py to include LangSmithNotFoundError along with the existing LangSmithError. This change improves the robustness of the error handling mechanism.
278
+ ## [Updated project version to 0.1.0](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/bbb9f000d8907e12c2aea643fb01e234b8d771bc)
279
+ Mon Oct 30 12:03:02 2023 -0400
280
+ - The project's version number has been updated from 0.0.16 to 0.1.0 in the bumpver.toml file, kubernetes resource file, and the main application file.
281
+ ## [Added mistralai/Mistral-7B-Instruct-v0.1 to Anyscale Endpoints](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d8cef94cffde0307292685d7273a0bf7a0974d02)
282
+ Mon Oct 30 11:31:43 2023 -0400
283
+ - In the README.md file, a new endpoint mistralai/Mistral-7B-Instruct-v0.1 was added under the section of Anyscale Endpoints.
284
+ - In the defaults.py file, the same endpoint was added to the MODEL_DICT dictionary under the key-value pair 'mistralai/Mistral-7B-Instruct-v0.1': 'Anyscale Endpoints'.
285
+ - The SUPPORTED_MODELS list was updated accordingly to include this new endpoint.
286
+ ## [Updated langsmith package version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/018041a3bdd72aaf3ab62b6eecba51ac18c93bcd)
287
+ Mon Oct 30 12:50:15 2023 +0000
288
+ - The langsmith package version in requirements.txt has been updated from 0.0.49 to 0.0.53. This update might include bug fixes, new features, or improvements.
289
+ ## [Updated langchain version in requirements](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/1215664e1bcb9b0a1f7f90a608fa16dc68dbbd0a)
290
+ Mon Oct 30 12:49:54 2023 +0000
291
+ - The langchain package version in requirements.txt has been updated from 0.0.320 to 0.0.325. This update might include bug fixes, security patches or new features.
292
+ ## [Bump version from 0.0.15 to 0.0.16](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/04871e0362967e38aceb00aa4fd13818a793ff1a)
293
+ Mon Oct 23 12:57:22 2023 -0400
294
+ - Updated the current version in bumpver.toml from 0.0.15 to 0.0.16.
295
+ - In the Kubernetes resources.yaml, updated the image version for langchain-streamlit-demo from 0.0.15 to 0.0.16.
296
+ - In langchain-streamlit-demo/app.py, updated the __version__ variable from 0.0.15 to 0.0.16.
297
+ ## [Updated package versions in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/839541a4fc5515d4554a36946001f1cee80f6fdc)
298
+ Mon Oct 23 12:49:36 2023 -0400
299
+ - Updated the versions of 'anthropic', 'langchain', and 'langsmith' in the requirements file. 'anthropic' is updated from version 0.3.11 to 0.5.0, 'langchain' from 0.0.315 to 0.0.320, and 'langsmith' from 0.0.44 to 0.0.49.
300
+ ## [Added 'validators' package to requirements](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/a1e0ab15cde332cd8efcba310fb67e25cb990783)
301
+ Fri Oct 20 22:54:23 2023 +0000
302
+ - The 'validators' package was added to the requirements.txt file. This package is not directly required by the project, but it has been pinned by Snyk to version 0.21.0 or newer to avoid a potential vulnerability.
303
+ ## [Updated badges in README](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/32f02019c445fb88beb73f00c6ffd0a17ff2a5d3)
304
+ Thu Oct 19 15:19:10 2023 -0400
305
+ - Replaced the Docker badge with a 'Push to Docker Hub' GitHub Actions workflow badge.
306
+ - Added a 'Push to HuggingFace Space' GitHub Actions workflow badge.
307
+ - Added an 'Update AI Changelog on Push to Main' GitHub Actions workflow badge.
308
+ ## [Added Azure OpenAI Service to README](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3353ff5eaa74c050414bf6b67ac590ac25d19f74)
309
+ Thu Oct 19 11:08:36 2023 -0400
310
+ - Updated README.md to include Azure OpenAI Service in the list of services and endpoints. A placeholder for configurable endpoints under Azure OpenAI Service has also been added.
311
+ ## [Added Black component to misc.xml and updated badges in README.md](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/1fb27e8b839a4c3d526da009c05ef3c08a1c2786)
312
+ Thu Oct 19 10:49:24 2023 -0400
313
+ - The commit introduces two changes:
314
+ - 1. A new Black component is added to the .idea/misc.xml file. This suggests that the Black Python code formatter has been configured for the project.
315
+ - 2. The README.md file has been updated to include new badges for code maintainability, issues, technical debt, and known vulnerabilities. The order of the existing badges has also been rearranged.
316
+ ## [Version Bump from 0.0.14 to 0.0.15](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/cc115e36633b7d899076da029c59dda03ca177ec)
317
+ Mon Oct 16 14:09:34 2023 -0400
318
+ - The version number has been increased from 0.0.14 to 0.0.15. This change has been reflected in the bumpver.toml file, the Kubernetes resources file, and the langchain-streamlit-demo app.py file. The Docker image used in the Kubernetes resources file has also been updated to reflect this new version number.
319
+ ## [Updated several package versions in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/cfa1e0b55c4f108b30ff6c7389668f1677f91437)
320
+ Mon Oct 16 14:02:49 2023 -0400
321
+ - Updated the version of langchain from 0.0.308 to 0.0.315.
322
+ - Updated the version of langsmith from 0.0.43 to 0.0.44.
323
+ - Updated the version of pypdf from 3.16.2 to 3.16.4.
324
+ ## [Updated environment variable name in Kubernetes config](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/62281947edc36d93259d723b8b4b63f3b9b646d1)
325
+ Fri Oct 6 21:19:03 2023 -0400
326
+ - In the Kubernetes configuration file 'resources.yaml', the environment variable name 'SHOW_LANGCHAIN_OPTIONS' was replaced with 'SHOW_LANGSMITH_OPTIONS'. This change reflects an update in the naming convention or the service being used.
327
+ ## [Bumped application version to 0.0.14](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/eb059075d36e4b09269df5b75dbea1b0e4e22f11)
328
+ Fri Oct 6 20:59:11 2023 -0400
329
+ - Updated the version of the application in bumpver.toml, kubernetes/resources.yaml, and langchain-streamlit-demo/app.py from 0.0.13 to 0.0.14.
330
+ ## [Refactored app.py to use Streamlit session state for storing global variables](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/e9f7a777844336b99d3bc8c2270e77e2acb0e7e7)
331
+ Fri Oct 6 20:47:25 2023 -0400
332
+ - This commit refactors the app.py file of the langchain-streamlit-demo to use Streamlit's session state for storing global variables. This includes API keys, project names, and Azure configurations. A new function 'azure_state_or_default' has been introduced to update the session state for Azure configurations. This change allows for better state management and persistence across multiple sessions.
333
+ ## [Added input field for Azure OpenAI EMB deployment name](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/b44c9a31a33a9b7d3b0e347a0ffe4ea31c068e81)
334
+ Fri Oct 6 18:40:55 2023 -0400
335
+ - An input field for the Azure OpenAI EMB deployment name has been added to the sidebar of the Streamlit application. This allows users to specify the name of their Azure OpenAI EMB deployment.
336
+ ## [Added Azure OpenAI Embeddings option to app](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/c60388636d63567bd9bfe4b7bbfebf734d3100da)
337
+ Fri Oct 6 18:35:40 2023 -0400
338
+ - This commit introduces the option to use Azure OpenAI for embeddings in the langchain-streamlit-demo app. It adds the necessary environment variables and updates the code to handle the new option. The changes include:
339
+ - 1. Addition of the AZURE_OPENAI_EMB_DEPLOYMENT_NAME environment variable in the Kubernetes resources.
340
+ - 2. Update of the app.py file to handle the Azure OpenAI option. If Azure embeddings are available, a toggle is displayed to the user to switch between Azure and OpenAI directly.
341
+ - 3. Update of the get_texts_and_retriever function in llm_resources.py to accept additional arguments for azure_kwargs and use_azure.
342
+ - 4. Update of the defaults.py file to include the AZURE_OPENAI_EMB_DEPLOYMENT_NAME in the list of Azure environment variables.
343
+ ## [Refactored code to improve readability and maintainability](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/0ce4fb3a9cb43ee563729df1d6b682511e17248f)
344
+ Fri Oct 6 18:15:24 2023 -0400
345
+ - 1. Updated kubernetes resource configuration to add environment variables for SHOW_LANGCHAIN_OPTIONS and SHOW_AZURE_OPTIONS.
346
+ - 2. Refactored the app.py script to import default values from a single source, improving readability and maintainability of the code.
347
+ - 3. Updated defaults.py to define a namedtuple for default values, which is imported in other scripts.
348
+ - 4. Modified llm_resources.py to accommodate changes in the import of default values.
349
+ ## [Refactor code by moving logic to a separate module](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/21eccfc51cf90268826929cddbf2bfa42bc2f5eb)
350
+ Fri Oct 6 16:26:26 2023 -0400
351
+ - The commit moves a significant amount of logic from 'app.py' to a new module named 'llm_resources.py'. This includes the methods for getting the runnable instance, the language model, and the texts and retriever. The aim of this refactoring is to improve code organization, readability, and maintainability.
352
+ ## [Refactored code and improved project structure](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/87d698488900d63b992059b6f291d6981773fb4b)
353
+ Fri Oct 6 15:59:43 2023 -0400
354
+ - Moved model constants and environment variables into a separate 'defaults.py' file for better code organization and readability.
355
+ - Updated 'app.py' to import these constants and variables from the new 'defaults.py' file.
356
+ - Modified '.idea/langchain-streamlit-demo.iml' to include a new source folder, improving the project's structure.
357
+ ## [Added Azure OpenAI environment variables to Kubernetes deployment](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f39ac3b55d8e57db36ff4a43a4b95dda1fa46e9d)
358
+ Fri Oct 6 14:15:57 2023 -0400
359
+ - In the Kubernetes resource configuration file, several environment variables related to Azure OpenAI have been added. These include the base URL, API version, deployment name, API key, and model version. The values for these variables are fetched from the 'langchain-streamlit-demo-secret' secret.
360
+ ## [Bumped version from 0.0.12 to 0.0.13](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d767997980a751389dcbec81b1bcaa1c10267534)
361
+ Fri Oct 6 14:03:44 2023 -0400
362
+ - Updated the current_version in bumpver.toml from 0.0.12 to 0.0.13.
363
+ - Updated the image tag in the Kubernetes resources.yaml file to use the new version 0.0.13.
364
+ - Updated the __version__ variable in the app.py file to reflect the new version 0.0.13.
365
+ ## [Refactored application code and updated dependencies](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/979e3bd9fe449bea04e5ceda5c1a72be2e824c58)
366
+ Fri Oct 6 13:58:33 2023 -0400
367
+ - Refactored the application code in 'langchain-streamlit-demo/app.py' to improve clarity and organization. Changes include renaming 'AZURE' to 'Azure OpenAI' in the 'MODEL_DICT' and modifying related conditional checks, renaming 'Advanced Options' to 'Advanced Settings', and restructuring 'LangSmith Options' into its own section within the sidebar.
368
+ - Updated the 'streamlit' version from '1.27.1' to '1.27.2' in 'requirements.txt'.
369
+ ## [Added support for Azure Chat models in the Streamlit application](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/72c3d8c60b3e15ce8d89f926ffe2ab845d3d9c1b)
370
+ Fri Oct 6 13:50:43 2023 -0400
371
+ - The commit introduces Azure Chat models into the Streamlit application. It includes the addition of the AzureChatOpenAI model in the import statement and the MODEL_DICT. Environment variables for Azure are also defined and retrieved from the system environment. User interface elements for Azure options have been added within an expandable section in the sidebar. Finally, an instance of AzureChatOpenAI is created if all Azure details are available and the selected provider is Azure.
372
+ ## [Updated langsmith package](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/e4b72fedeb71c822b6a76ed84199fef2bbc3bf8a)
373
+ Fri Oct 6 13:02:43 2023 -0400
374
+ - The langsmith package version was updated from 0.0.41 to 0.0.43 in the requirements.txt file.
375
+ ## [Updated langchain version in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/2c41972749e5524bba738b37e6d31416e657fec6)
376
+ Thu Oct 5 13:54:14 2023 +0000
377
+ - The langchain package version in requirements.txt has been upgraded from 0.0.305 to 0.0.308. This update may include bug fixes, feature enhancements, or performance improvements.
378
+ ## [Updated application version to 0.0.12](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/2bee8f19e2fa71c333588a3531b55fe062701328)
379
+ Mon Oct 2 09:13:48 2023 -0400
380
+ - The application version has been updated from 0.0.11 to 0.0.12 in three different files. These include bumpver.toml, resources.yaml under kubernetes, and app.py under langchain-streamlit-demo. In bumpver.toml, the current_version value is updated. In resources.yaml, the image version for the container 'langchain-streamlit-demo' is updated. In app.py, the __version__ variable is updated to reflect the new version.
381
+ ## [Updated dependencies in requirements.txt](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/9747a2d97d4e60861e6d0cc8de7ca8076a6ac971)
382
+ Mon Oct 2 09:10:05 2023 -0400
383
+ - The langchain and langsmith dependencies have been updated to versions 0.0.305 and 0.0.41 respectively.
384
+ - The openai dependency has been updated to version 0.28.1.
385
+ - The previous comment about rolling back the langchain update to avoid a bug has been removed, implying the bug has been fixed in the new version.
386
+ ## [Version Bump from 0.0.10 to 0.0.11](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/58978f749bdf319a2c2f76e74a46e7d905b7bf69)
387
+ Sat Sep 30 01:31:32 2023 -0400
388
+ - Updated the current_version in bumpver.toml from 0.0.10 to 0.0.11.
389
+ - In the Kubernetes resources.yaml, updated the image version of langchain-streamlit-demo from 0.0.10 to 0.0.11.
390
+ - In the langchain-streamlit-demo/app.py, updated the __version__ from 0.0.10 to 0.0.11.
391
+ ## [Updated README.md with minor content and structure changes](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/241c14d23e150e0be6edee2c28e32c1b4a519c73)
392
+ Sat Sep 30 01:29:08 2023 -0400
393
+ - This commit includes changes to the README.md file. The authorship of the README has been clarified to indicate that it was originally written by Claude 2. The Features section has been updated to include a new model from Anyscale Endpoints, and to mention the addition of various forms of document chat. The Code Overview section was removed. A minor formatting change was made to the Docker run command. The Docker Compose instructions were simplified by removing a redundant command.
394
+ ## [Improved UI labels and refactored code in langchain-streamlit-demo](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f8e912146cbca42cbd456abb123b5223b0924c45)
395
+ Sat Sep 30 01:24:47 2023 -0400
396
+ - This commit includes changes to improve the user interface labels for better readability. The labels 'chunk_size' and 'chunk_overlap' have been changed to 'Number of Tokens per Chunk' and 'Chunk Overlap' respectively.
397
+ - Additionally, the code for handling the full response and the initialization of the `st.session_state.chain` has been refactored for better readability and maintainability. The code now clearly distinguishes between the cases when `use_document_chat` is true or false, and the initialization of `st.session_state.chain` is more streamlined.
398
+ ## [Refactored chat functionality and removed unnecessary code in app.py and qagen.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/923e6fac55336c07c8af10b74742b117517bd757)
399
+ Sat Sep 30 01:10:43 2023 -0400
400
+ - In app.py, removed the StreamlitCallbackHandler import and simplified the logic for handling chat inputs. Removed the document chat condition in the if statement, and directly implemented the regular chat functionality. Simplified the condition for using document chat, and refactored the way rag_runnable is retrieved based on the document chat chain type.
401
+ - In qagen.py, removed the unnecessary import of reduce from functools and the combine_qa_pair_lists function. Simplified the get_rag_qa_gen_chain function by directly converting the parsed_output to a string.
402
+ ## [Refactored code for readability and efficiency](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/bfaa0c3cf1792d9cb5086657f9ded983ba616662)
403
+ Fri Sep 29 23:12:56 2023 -0400
404
+ - This commit includes changes in the 'app.py' and 'qagen.py' files. In 'app.py', the code has been refactored to improve readability and efficiency. The configuration dictionary has been moved outside the if-conditions to avoid redundancy. Also, the condition checking for 'Summarization' and 'Q&A Generation' has been combined to reduce nested if-statements.
405
+ - In the 'qagen.py' file, two new methods 'to_str' have been added to the 'QuestionAnswerPair' and 'QuestionAnswerPairList' classes. These methods convert the question and answer pairs into a string format. This change has moved the responsibility of string formatting from 'app.py' to 'qagen.py', making the code more modular and easier to maintain.
406
+ ## [Updated summarization functionality in Streamlit app](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/dd9bfbddff559ce0065c236ccc6419f987a61664)
407
+ Fri Sep 29 22:43:24 2023 -0400
408
+ - Replaced the existing get_summarization_chain function with get_rag_summarization_chain in the Streamlit app.
409
+ - The get_rag_summarization_chain function now takes in the prompt, retriever and the language model as parameters.
410
+ - Refactored the way the summarization chain is invoked and the full response is generated.
411
+ - Updated the get_rag_summarization_chain function in the summarize module to return a RunnableSequence.
412
+ ## [Updated model_name parameter in ChatOpenAI instantiation](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/06099804b5d0a4d635beb8a0021ac84b22cb0529)
413
+ Fri Sep 29 18:38:23 2023 -0400
414
+ - Replaced hardcoded 'test' value for model_name parameter with a variable named 'model'. This change allows the model name to be dynamically set when the ChatOpenAI class is instantiated.
415
+ ## [Refactored model instantiation and removed deprecated functions](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/c2ef57040f3231cc3fa80157d93d0d8420f21351)
416
+ Fri Sep 29 18:38:01 2023 -0400
417
+ - Updated the instantiation of ChatOpenAI, ChatAnthropic, and ChatAnyscale classes by swapping the model and model_name parameters to match their class definitions.
418
+ - Removed the commented out get_qa_gen_chain function in qagen.py.
419
+ - Removed commented out code related to raw_results and results in app.py, simplifying the logic.
420
+ ## [Refactored the data processing pipeline](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/8106321374be538f2740587a9a3d68e9cb82310f)
421
+ Fri Sep 29 18:31:46 2023 -0400
422
+ - Removed the 'combine_qa_pair_lists' function from the data processing pipeline in 'app.py'.
423
+ - Directly accessed 'QuestionAnswerPairs' from 'raw_results' instead of using 'combine_qa_pair_lists' function.
424
+ - Commented out the print statement for 'raw_results'.
425
+ ## [Refactored code to change 'input' to 'context' in langchain-streamlit-demo](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3550ebd119e342869167a228929538c069350942)
426
+ Fri Sep 29 18:19:58 2023 -0400
427
+ - This commit includes a change in the variable name from 'input' to 'context' in both app.py and qagen.py files. The change was made in the section where the document page content is being processed. This change is likely aimed at improving code readability and consistency.
428
+ ## [Added customizability for number of chunks in retriever](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/457889e5dc68143a1a5f935ca6af849bd380666c)
429
+ Fri Sep 29 18:16:51 2023 -0400
430
+ - This commit introduces a slider in the UI allowing the user to select the number of chunks that will be used for context in the retriever. The 'get_texts_and_retriever' function was updated to include a new parameter 'k' that defaults to the newly introduced constant 'DEFAULT_RETRIEVER_K'. This 'k' value is then used in the creation of both the 'bm25_retriever' and 'faiss_retriever'.
431
+ ## [Updated Q&A Generation method and invocation](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/8aab446c1cbafbdb04dcf6d56ed77413f1e63f65)
432
+ Fri Sep 29 18:13:30 2023 -0400
433
+ - Replaced the get_qa_gen_chain method with get_rag_qa_gen_chain in app.py and qagen.py. This change updates the Q&A Generation method used in the Document Chat feature.
434
+ - Changed the way the Q&A Generation method is invoked. Instead of the batch method, the invoke method is now used. This change is expected to improve the efficiency of the Document Chat feature.
435
+ ## [Implemented RAG-based Q&A Generation Chain](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/6467ea59cd8b5eb4859d20c8f84152402833cb92)
436
+ Fri Sep 29 18:04:08 2023 -0400
437
+ - Added a new function 'get_rag_qa_gen_chain' in 'qagen.py' to set up a RAG-based Q&A generation chain using a retriever and a language model.
438
+ - Adjusted the 'app.py' to include a commented-out option to use the new RAG-based Q&A generation chain.
439
+ ## [Bump version from 0.0.9 to 0.0.10](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/bb29f017b57cd891d1f9ae86e212ec6c92b5aa43)
440
+ Fri Sep 29 13:17:34 2023 -0400
441
+ - Updated the version number in the bumpver.toml, kubernetes/resources.yaml, and langchain-streamlit-demo/app.py files. The new version is 0.0.10.
442
+ ## [Updated retriever logic and removed question validation](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/930d4126fe97dbb403fa498b5322e10815d06179)
443
+ Fri Sep 29 11:17:45 2023 -0400
444
+ - In the 'langchain-streamlit-demo/app.py' file, the logic to retrieve texts has been updated. The FAISS retriever has been replaced with an ensemble retriever that uses both the BM25 and FAISS retrievers. The BM25 retriever's 'k' parameter has been set to 4, and the FAISS retriever has been updated to use a vector store.
445
+ - In the 'langchain-streamlit-demo/qagen.py' file, the field validator for the 'question' field in the 'QuestionAnswerPair' class has been removed. This means that questions no longer need to end with a question mark to be valid.
446
+ - The 'requirements.txt' file has been updated to include the 'rank_bm25==0.2.2' package, and the 'streamlit' package has been updated to version '1.27.1'.
447
+ ## [Updated the refine_template in summarize.py](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/736288ed897a6bf1b5c0be7c0481011598351395)
448
+ Thu Sep 28 20:55:25 2023 -0400
449
+ - The refine_template string in the summarize.py file has been updated. A newline character has been added after the 'User input: {query}' part of the string for better readability.
450
+ ## [Updated application version to 0.0.9](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/40604bea7723c4c05b4c36289950e6d8a25b7690)
451
+ Thu Sep 28 20:41:33 2023 -0400
452
+ - The version number in the bumpver.toml file has been updated from 0.0.8 to 0.0.9.
453
+ - The Docker image version for the langchain-streamlit-demo app in the Kubernetes resources.yaml file has been updated from 0.0.8 to 0.0.9.
454
+ - The __version__ variable in the app.py file of the langchain-streamlit-demo app has been updated from 0.0.8 to 0.0.9.
455
+ ## [Improved text formatting in Q&A response](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/4eaf9de17247ed7e6bdc1771ff31639cca9e903d)
456
+ Thu Sep 28 20:39:28 2023 -0400
457
+ - This commit adjusts the formatting of the Q&A response in the langchain-streamlit-demo app. It adds an extra newline between the question and answer parts, and another newline between each Q&A pair for better readability.
458
+ ## [Updated application version to 0.0.8](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/8c80fe821129d05b8b714beb56a4e0bbca6ce676)
459
+ Thu Sep 28 20:36:46 2023 -0400
460
+ - The application's version number has been updated from 0.0.7 to 0.0.8 in the following files: bumpver.toml, resources.yaml, and app.py.
461
+ - In bumpver.toml, the current_version field was updated to reflect the new version.
462
+ - In resources.yaml, the image tag for the langchain-streamlit-demo container was updated to use the new version.
463
+ - In app.py, the __version__ variable was updated to the new version.
464
+ ## [Refactor variable names in Streamlit app](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/9bf9004ce3ba4160e1c33f57e0c5e48c0ff4f628)
465
+ Thu Sep 28 20:33:17 2023 -0400
466
+ - The variable 'output_text' was renamed to 'full_response' in the Streamlit application to better reflect its purpose. This change improves code readability and understanding.
467
+ ## [Bumped version from 0.0.6 to 0.0.7](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/d41f4a4356709af4dbd81982fdefb0a6dba21ef6)
468
+ Thu Sep 28 19:56:12 2023 -0400
469
+ - Updated the version number in bumpver.toml, resources.yaml, and app.py.
470
+ - This commit includes changes to the version number in the bumpver configuration, the Docker image tag in the Kubernetes resources, and the version variable in the app.py file.
471
+ ## [Added Summarization Feature to Streamlit App](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/47c2ffc283d1e1754c1f64ab5fb793694bc9f24f)
472
+ Thu Sep 28 19:53:59 2023 -0400
473
+ - This commit introduces a summarization feature to the Streamlit application. It does so by creating a new 'summarize.py' file and integrating it into the 'app.py' file.
474
+ - In 'app.py', the 'LLMChain' import has been moved and the 'get_summarization_chain' function has been imported from 'summarize.py'.
475
+ - A new option 'Summarization' has been added to the 'Document Chat Chain Type' dropdown menu.
476
+ - When 'Summarization' is selected from the dropdown, the 'get_summarization_chain' function is called to create a summarization chain.
477
+ - The summarization chain is then used to generate a summary of the document, which is displayed in the Streamlit app.
478
+ - In the 'summarize.py' file, a new summarization chain is defined using the 'load_summarize_chain' function from the 'langchain.chains.summarize' module. The chain uses two custom prompt templates for summarizing and refining the document text.
479
+ ## [Enhanced document chat functionality in langchain-streamlit-demo](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/622ac6610de2f89368031d57ebd148259e5d7fcc)
480
+ Thu Sep 28 16:55:16 2023 -0400
481
+ - This commit includes enhancements to the document chat functionality in the langchain-streamlit-demo application. It introduces a new document chat chain type 'Q&A Generation' and updates the provider variable to be stored in the session state. The commit also adds a new file 'qagen.py' which contains code for generating question and answer pairs from a given text.
482
+ ## [Bump version from 0.0.5 to 0.0.6](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/f431ca56717b9e704226c3448a552fe31c90d77d)
483
+ Thu Sep 28 14:42:31 2023 -0400
484
+ - The version number in the 'bumpver.toml', 'kubernetes/resources.yaml', and 'langchain-streamlit-demo/app.py' files has been updated from 0.0.5 to 0.0.6. This indicates a new iteration of the software with potential minor changes or bug fixes.
485
+ ## [Updated ruff-pre-commit version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/50b28c9ac810cf9ff1c58e0b98f4ca7dfe3f94f5)
486
+ Wed Sep 27 20:58:22 2023 -0400
487
+ - The ruff-pre-commit version in the pre-commit configuration file was updated from v0.0.290 to v0.0.291.
488
+ ## [Updated file exclusions in pre-commit config](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/c8b46036933d50ca6befc5d4fa43bcb29f05c75a)
489
+ Wed Sep 27 20:57:54 2023 -0400
490
+ - The pre-commit configuration has been updated to exclude the AI_CHANGELOG.md file. Previously, the configuration was set to exclude .idea and docs directories. The repository and hook details remain unchanged.
491
+ ## [Refactored chain_type_help in app.py and updated AI_CHANGELOG.md](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/a1b0a6fd0b22021079e741929eb7671855192cb0)
492
+ Wed Sep 27 20:56:47 2023 -0400
493
+ - In app.py, the chain_type_help dictionary was refactored to directly generate a string with the help links for each chain_type_name, removing the need for a separate dictionary.
494
+ - In AI_CHANGELOG.md, a newline was added at the end of the file and entries were made for the addition of numpy and tornado to requirements.txt and the update of the token used for code checkout in the GitHub workflow.
495
+ ## [Updated GitHub Action to Push to HuggingFace Space](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/e95e574c846541fd959bd0d0355178fae542dd8e)
496
+ Wed Sep 27 17:05:25 2023 +0000
497
+ - This commit modifies the triggering conditions for the GitHub Action workflow that pushes updates to HuggingFace Space. Previously, the workflow was triggered on each push with any tag. Now, it is triggered upon completion of the 'Update AI Changelog on Push to Main' workflow on the 'main' branch.
498
+ - Additionally, the 'push-to-huggingface' job has been updated to depend on the completion of the 'update-changelog' job.
499
+ ## [Updated version number from 0.0.2 to 0.0.5](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/55fa7419137cf54127cbd03114c0c0284397cfd9)
500
+ Wed Sep 27 10:56:40 2023 -0400
501
+ - The version number in the bumpver configuration file has been updated from 0.0.2 to 0.0.5.
502
+ - The image version in the Kubernetes resources file has been updated to match the new version number.
503
+ - The __version__ variable in the langchain-streamlit-demo app has been updated to reflect the new version number.
504
+ ## [Updated page title to include version number](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/783c740fe52c44c3f3d9d5ad78b6c1784fa93e97)
505
+ Wed Sep 27 10:46:57 2023 -0400
506
+ - The page title of the Streamlit application was previously just the name of the application. The title now includes the version number, which makes it easier to track and verify the version of the application in use.
507
+ ## [Added 'codellama/CodeLlama-34b-Instruct-hf' to Model Dictionary](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/68f6d34a4cefd91425cbc215f323fbd57dd6e4a7)
508
+ Wed Sep 27 10:46:24 2023 -0400
509
+ - The commit introduces a new model 'codellama/CodeLlama-34b-Instruct-hf' into the MODEL_DICT dictionary. This update extends the list of models supported by the 'Anyscale Endpoints'.
510
+ ## [Bumped version from 0.0.1 to 0.0.2](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/9feadf73e8c66425a565c99ce3088249bc4699f1)
511
+ Wed Sep 27 00:03:38 2023 -0400
512
+ - Updated the version number in bumpver.toml, Kubernetes resources.yaml, and the app.py file of the langchain-streamlit-demo application. The new version is 0.0.2.
513
+ ## [Updated app version](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/a1065bb282837cf191d30bcb45c638bd15c5b77a)
514
+ Wed Sep 27 00:00:28 2023 -0400
515
+ - The version number in langchain-streamlit-demo/app.py was updated from 0.0.0 to 0.0.1.
516
+ ## [Updated image version in Kubernetes resources and bumpver file](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/35cffe74d37db50ad5ae17a6e6af4d2131c1a5c3)
517
+ Tue Sep 26 23:59:47 2023 -0400
518
+ - In the 'bumpver.toml' file, the image version placeholder in 'kubernetes/resources.yaml' was corrected by removing the unnecessary quotes.
519
+ - In the 'kubernetes/resources.yaml' file, the image version for 'langchain-streamlit-demo' was updated from 'latest' to '0.0.1'.
520
+ ## [Implement versioning and modify GitHub workflows](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/7f34c9b5e16996dcb8eb5cdd3f5cdc86d7bf2b11)
521
+ Tue Sep 26 23:58:24 2023 -0400
522
+ - Introduced semantic versioning using bumpver. The current version is now tracked in a new file 'bumpver.toml' and also reflected in 'app.py' and the Docker image tag in 'kubernetes/resources.yaml'.
523
+ - Modified GitHub workflows 'docker-hub.yml' and 'hf-space.yml' to trigger on new tags instead of pushes to the main branch. The Docker image tag is now the release version instead of the git SHA.
524
+ - Removed the step to store the git SHA in 'docker-hub.yml'.
525
+ - No functional changes were made to 'langchain-streamlit-demo/app.py' or 'kubernetes/resources.yaml'. The imagePullPolicy remains as 'Always'.
526
+ ## [Updated requirements.txt for better package management](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/5085ade2d646a2670929e518e78b881ea2ffd0a5)
527
+ Tue Sep 26 23:14:05 2023 -0400
528
+ - Rolled back langchain package from version 0.0.301 to 0.0.300 to avoid a bug in langchain's chatanthropic.
529
+ - Pinned numpy to version 1.22.2 as suggested by Snyk to avoid a vulnerability.
530
+ - Reordered the packages for better readability.
531
+ ## [Added numpy and tornado to requirements.txt to avoid vulnerabilities](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/3f0e220f9f77d561510dd04b09f1c3c509a5b28f)
532
+ Tue Sep 26 12:56:59 2023 +0000
533
+ - The numpy and tornado packages were added to the requirements.txt file. These packages are not directly required by our application but were added to avoid potential vulnerabilities as suggested by Snyk.
534
+ ## [Updated token used for code checkout in GitHub workflow](https://github.com/joshuasundance-swca/langchain-streamlit-demo/commit/b0c4e1ca12f86ea6113ee2c86d38c39d3035f395)
535
+ Tue Sep 26 08:56:55 2023 -0400
536
+ - In the GitHub Actions workflow file 'ai_changelog.yml', the personal access token used for checking out code has been updated. The token has been changed from 'PAT' to 'WORKFLOW_GIT_ACCESS_TOKEN'.
Dockerfile ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.11-slim-bookworm
2
+
3
+ RUN adduser --uid 1000 --disabled-password --gecos '' appuser
4
+ USER 1000
5
+
6
+ ENV PYTHONDONTWRITEBYTECODE=1 \
7
+ PYTHONUNBUFFERED=1 \
8
+ PATH="/home/appuser/.local/bin:$PATH"
9
+
10
+ RUN pip install --user --no-cache-dir --upgrade pip
11
+ COPY ./requirements.txt /home/appuser/requirements.txt
12
+ RUN pip install --user --no-cache-dir --upgrade -r /home/appuser/requirements.txt
13
+
14
+ COPY ./langchain-streamlit-demo/ /home/appuser/langchain-streamlit-demo/
15
+
16
+ WORKDIR /home/appuser/langchain-streamlit-demo
17
+ EXPOSE 7860
18
+
19
+ CMD ["streamlit", "run", "/home/appuser/langchain-streamlit-demo/app.py", "--server.port", "7860", "--server.address", "0.0.0.0"]
LICENSE ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2023 Joshua Sundance Bailey
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
6
+
7
+ The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
8
+
9
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
README.md ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: langchain-streamlit-demo
3
+ emoji: 🦜
4
+ colorFrom: green
5
+ colorTo: red
6
+ sdk: docker
7
+ app_port: 7860
8
+ pinned: true
9
+ tags: [langchain, streamlit, docker]
10
+ ---
11
+
12
+ # langchain-streamlit-demo
13
+
14
+ [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
15
+ [![python](https://img.shields.io/badge/Python-3.11-3776AB.svg?style=flat&logo=python&logoColor=white)](https://www.python.org)
16
+
17
+ [![Push to Docker Hub](https://github.com/joshuasundance-swca/langchain-streamlit-demo/actions/workflows/docker-hub.yml/badge.svg)](https://github.com/joshuasundance-swca/langchain-streamlit-demo/actions/workflows/docker-hub.yml)
18
+ [![Docker Image Size (tag)](https://img.shields.io/docker/image-size/joshuasundance/langchain-streamlit-demo/latest)](https://hub.docker.com/r/joshuasundance/langchain-streamlit-demo)
19
+
20
+ [![Push to HuggingFace Space](https://github.com/joshuasundance-swca/langchain-streamlit-demo/actions/workflows/hf-space.yml/badge.svg)](https://github.com/joshuasundance-swca/langchain-streamlit-demo/actions/workflows/hf-space.yml)
21
+ [![Open HuggingFace Space](https://huggingface.co/datasets/huggingface/badges/raw/main/open-in-hf-spaces-sm.svg)](https://huggingface.co/spaces/joshuasundance/langchain-streamlit-demo)
22
+
23
+ ![Code Climate maintainability](https://img.shields.io/codeclimate/maintainability/joshuasundance-swca/langchain-streamlit-demo)
24
+ ![Code Climate issues](https://img.shields.io/codeclimate/issues/joshuasundance-swca/langchain-streamlit-demo)
25
+ ![Code Climate technical debt](https://img.shields.io/codeclimate/tech-debt/joshuasundance-swca/langchain-streamlit-demo)
26
+
27
+ [![pre-commit](https://img.shields.io/badge/pre--commit-enabled-brightgreen?logo=pre-commit&logoColor=white)](https://github.com/pre-commit/pre-commit)
28
+ [![Ruff](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/charliermarsh/ruff/main/assets/badge/v1.json)](https://github.com/charliermarsh/ruff)
29
+ [![Checked with mypy](http://www.mypy-lang.org/static/mypy_badge.svg)](http://mypy-lang.org/)
30
+ [![Code style: black](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)
31
+
32
+ [![security: bandit](https://img.shields.io/badge/security-bandit-yellow.svg)](https://github.com/PyCQA/bandit)
33
+ ![Known Vulnerabilities](https://snyk.io/test/github/joshuasundance-swca/langchain-streamlit-demo/badge.svg)
34
+
35
+ [![Update AI Changelog on Push to Main](https://github.com/joshuasundance-swca/langchain-streamlit-demo/actions/workflows/ai_changelog.yml/badge.svg)](https://github.com/joshuasundance-swca/langchain-streamlit-demo/actions/workflows/ai_changelog.yml)
36
+
37
+
38
+ This project shows how to build a simple chatbot UI with [Streamlit](https://streamlit.io) and [LangChain](https://langchain.com).
39
+
40
+ This `README` was originally written by [Claude 2](https://www.anthropic.com/index/claude-2), an LLM from [Anthropic](https://www.anthropic.com/).
41
+
42
+ # Features
43
+ - Chat interface for talking to AI assistant
44
+ - Supports models from
45
+ - [OpenAI](https://openai.com/)
46
+ - `gpt-3.5-turbo`
47
+ - `gpt-4`
48
+ - [Anthropic](https://www.anthropic.com/)
49
+ - `claude-instant-v1`
50
+ - `claude-2`
51
+ - [Anyscale Endpoints](https://endpoints.anyscale.com/)
52
+ - `meta-llama/Llama-2-7b-chat-hf`
53
+ - `meta-llama/Llama-2-13b-chat-hf`
54
+ - `meta-llama/Llama-2-70b-chat-hf`
55
+ - `codellama/CodeLlama-34b-Instruct-hf`
56
+ - `mistralai/Mistral-7B-Instruct-v0.1`
57
+ - [Azure OpenAI Service](https://azure.microsoft.com/en-us/products/ai-services/openai-service/)
58
+ - `[configurable]`
59
+ - Streaming output of assistant responses
60
+ - Leverages LangChain for dialogue and memory management
61
+ - Integrates with [LangSmith](https://smith.langchain.com) for tracing conversations
62
+ - Allows giving feedback on assistant's responses
63
+ - Tries reading API keys and default values from environment variables
64
+ - Parameters in sidebar can be customized
65
+ - Includes various forms of document chat
66
+ - Question/Answer Pair Generation
67
+ - Summarization
68
+ - Standard retrieval chains
69
+
70
+ # Deployment
71
+ `langchain-streamlit-demo` is deployed as a [Docker image](https://hub.docker.com/r/joshuasundance/langchain-streamlit-demo) based on the [`python:3.11-slim-bookworm`](https://github.com/docker-library/python/blob/81b6e5f0643965618d633cd6b811bf0879dee360/3.11/slim-bookworm/Dockerfile) image.
72
+ CI/CD workflows in `.github/workflows` handle building and publishing the image as well as pushing it to Hugging Face.
73
+
74
+ ## Run on HuggingFace Spaces
75
+ [![Open HuggingFace Space](https://huggingface.co/datasets/huggingface/badges/raw/main/open-in-hf-spaces-sm.svg)](https://huggingface.co/spaces/joshuasundance/langchain-streamlit-demo)
76
+
77
+ ## With Docker (pull from Docker Hub)
78
+
79
+ 1. _Optional_: Create a `.env` file based on `.env-example`
80
+ 2. Run in terminal:
81
+
82
+ `docker run -p 7860:7860 joshuasundance/langchain-streamlit-demo:latest`
83
+
84
+ or
85
+
86
+ `docker run -p 7860:7860 --env-file .env joshuasundance/langchain-streamlit-demo:latest`
87
+
88
+ 3. Open http://localhost:7860 in your browser
89
+
90
+ ## Docker Compose (build locally)
91
+ 1. Clone the repo. Navigate to cloned repo directory
92
+ 2. _Optional_: Create a `.env` file based on `.env-example`
93
+ 3. Run in terminal:
94
+
95
+ `docker compose up`
96
+
97
+ 4. Open http://localhost:7860 in your browser
98
+
99
+ ## Kubernetes
100
+ 1. Clone the repo. Navigate to cloned repo directory
101
+ 2. Create a `.env` file based on `.env-example`
102
+ 3. Run bash script: `/bin/bash ./kubernetes/deploy.sh`
103
+ 4. Get the IP address for your new service: `kubectl get service langchain-streamlit-demo`
104
+
105
+ # Links
106
+ - [Streamlit](https://streamlit.io)
107
+ - [LangChain](https://langchain.com)
108
+ - [LangSmith](https://smith.langchain.com)
109
+ - [OpenAI](https://openai.com/)
110
+ - [Anthropic](https://www.anthropic.com/)
111
+ - [Anyscale Endpoints](https://endpoints.anyscale.com/)
112
+ - [Azure OpenAI Service](https://azure.microsoft.com/en-us/products/ai-services/openai-service/)
bumpver.toml ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [bumpver]
2
+ current_version = "2.1.4"
3
+ version_pattern = "MAJOR.MINOR.PATCH"
4
+ commit_message = "bump version {old_version} -> {new_version}"
5
+ tag_message = "{new_version}"
6
+ tag_scope = "default"
7
+ pre_commit_hook = ""
8
+ post_commit_hook = ""
9
+ commit = true
10
+ tag = true
11
+ push = true
12
+
13
+ [bumpver.file_patterns]
14
+ "bumpver.toml" = [
15
+ 'current_version = "{version}"',
16
+ ]
17
+ "langchain-streamlit-demo/app.py" = ['__version__ = "{version}"']
18
+ "kubernetes/resources.yaml" = [' image: joshuasundance/langchain-streamlit-demo:{version}']
docker-compose.yml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ version: '3.8'
2
+
3
+ services:
4
+ langchain-streamlit-demo:
5
+ image: langchain-streamlit-demo:latest
6
+ build: .
7
+ env_file:
8
+ - .env
9
+ ports:
10
+ - "${APP_PORT:-7860}:${APP_PORT:-7860}"
11
+ command: [
12
+ "streamlit", "run",
13
+ "/home/appuser/langchain-streamlit-demo/app.py",
14
+ "--server.port", "${APP_PORT:-7860}",
15
+ "--server.address", "0.0.0.0"
16
+ ]
kubernetes/deploy.sh ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/bin/bash
set -euo pipefail
IFS=$'\n\t'

# Recreate the Kubernetes secret that supplies the app's environment variables.
# The secret is rebuilt from .env on every deploy so updated values take effect.
if [ -n "$(kubectl get secret langchain-streamlit-demo-secret --ignore-not-found)" ]; then
    echo "Secret 'langchain-streamlit-demo-secret' already exists. Deleting and recreating."
    kubectl delete secret langchain-streamlit-demo-secret
else
    echo "Secret 'langchain-streamlit-demo-secret' does not exist. Creating."
fi

kubectl create secret generic langchain-streamlit-demo-secret --from-env-file=.env


# Deploy to Kubernetes
kubectl apply -f kubernetes/resources.yaml
kubernetes/resources.yaml ADDED
@@ -0,0 +1,118 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ apiVersion: apps/v1
2
+ kind: Deployment
3
+ metadata:
4
+ name: langchain-streamlit-demo-deployment
5
+ spec:
6
+ replicas: 1
7
+ selector:
8
+ matchLabels:
9
+ app: langchain-streamlit-demo
10
+ template:
11
+ metadata:
12
+ labels:
13
+ app: langchain-streamlit-demo
14
+ spec:
15
+ containers:
16
+ - name: langchain-streamlit-demo
17
+ image: joshuasundance/langchain-streamlit-demo:2.1.4
18
+ imagePullPolicy: Always
19
+ resources:
20
+ requests:
21
+ cpu: "100m"
22
+ memory: "200Mi"
23
+ limits:
24
+ cpu: "500m"
25
+ memory: "500Mi"
26
+ env:
27
+ - name: AZURE_OPENAI_BASE_URL
28
+ valueFrom:
29
+ secretKeyRef:
30
+ name: langchain-streamlit-demo-secret
31
+ key: AZURE_OPENAI_BASE_URL
32
+ - name: AZURE_OPENAI_API_VERSION
33
+ valueFrom:
34
+ secretKeyRef:
35
+ name: langchain-streamlit-demo-secret
36
+ key: AZURE_OPENAI_API_VERSION
37
+ - name: AZURE_OPENAI_DEPLOYMENT_NAME
38
+ valueFrom:
39
+ secretKeyRef:
40
+ name: langchain-streamlit-demo-secret
41
+ key: AZURE_OPENAI_DEPLOYMENT_NAME
42
+ - name: AZURE_OPENAI_EMB_DEPLOYMENT_NAME
43
+ valueFrom:
44
+ secretKeyRef:
45
+ name: langchain-streamlit-demo-secret
46
+ key: AZURE_OPENAI_EMB_DEPLOYMENT_NAME
47
+ - name: AZURE_OPENAI_API_KEY
48
+ valueFrom:
49
+ secretKeyRef:
50
+ name: langchain-streamlit-demo-secret
51
+ key: AZURE_OPENAI_API_KEY
52
+ - name: AZURE_OPENAI_MODEL_VERSION
53
+ valueFrom:
54
+ secretKeyRef:
55
+ name: langchain-streamlit-demo-secret
56
+ key: AZURE_OPENAI_MODEL_VERSION
57
+ - name: OPENAI_API_KEY
58
+ valueFrom:
59
+ secretKeyRef:
60
+ name: langchain-streamlit-demo-secret
61
+ key: OPENAI_API_KEY
62
+ - name: ANTHROPIC_API_KEY
63
+ valueFrom:
64
+ secretKeyRef:
65
+ name: langchain-streamlit-demo-secret
66
+ key: ANTHROPIC_API_KEY
67
+ - name: ANYSCALE_API_KEY
68
+ valueFrom:
69
+ secretKeyRef:
70
+ name: langchain-streamlit-demo-secret
71
+ key: ANYSCALE_API_KEY
72
+ - name: LANGCHAIN_API_KEY
73
+ valueFrom:
74
+ secretKeyRef:
75
+ name: langchain-streamlit-demo-secret
76
+ key: LANGCHAIN_API_KEY
77
+ - name: LANGCHAIN_PROJECT
78
+ value: "langchain-streamlit-demo"
79
+ - name: SHOW_LANGSMITH_OPTIONS
80
+ value: "False"
81
+ - name: SHOW_AZURE_OPTIONS
82
+ value: "False"
83
+ securityContext:
84
+ runAsNonRoot: true
85
+ ---
86
+ apiVersion: v1
87
+ kind: Service
88
+ metadata:
89
+ name: langchain-streamlit-demo-service
90
+ # configure on Azure and uncomment below to use a vnet
91
+ # annotations:
92
+ # service.beta.kubernetes.io/azure-load-balancer-internal: "true"
93
+ # service.beta.kubernetes.io/azure-load-balancer-ipv4: vnet.ip.goes.here
94
+ # service.beta.kubernetes.io/azure-dns-label-name: "langchain-streamlit-demo"
95
+ spec:
96
+ selector:
97
+ app: langchain-streamlit-demo
98
+ ports:
99
+ - protocol: TCP
100
+ port: 80
101
+ targetPort: 7860
102
+ type: LoadBalancer
103
+ ---
104
+ apiVersion: networking.k8s.io/v1
105
+ kind: NetworkPolicy
106
+ metadata:
107
+ name: langchain-streamlit-demo-network-policy
108
+ spec:
109
+ podSelector:
110
+ matchLabels:
111
+ app: langchain-streamlit-demo
112
+ policyTypes:
113
+ - Ingress
114
+ ingress:
115
+ - from: [] # An empty array here means it will allow traffic from all sources.
116
+ ports:
117
+ - protocol: TCP
118
+ port: 7860
langchain-streamlit-demo/.streamlit/config.toml ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ [theme]
2
+ primaryColor="#F63366"
3
+ backgroundColor="#FFFFFF"
4
+ secondaryBackgroundColor="#F0F2F6"
5
+ textColor="#262730"
6
+ font="sans serif"
langchain-streamlit-demo/app.py ADDED
@@ -0,0 +1,627 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from datetime import datetime
2
+ from typing import Tuple, List, Dict, Any, Union, Optional
3
+
4
+ import anthropic
5
+ import langsmith.utils
6
+ import openai
7
+ import streamlit as st
8
+ from langchain.agents import load_tools
9
+ from langchain.agents.tools import tool
10
+ from langchain.callbacks import StreamlitCallbackHandler
11
+ from langchain.callbacks.base import BaseCallbackHandler
12
+ from langchain.callbacks.manager import Callbacks
13
+ from langchain.callbacks.tracers.langchain import LangChainTracer, wait_for_all_tracers
14
+ from langchain.callbacks.tracers.run_collector import RunCollectorCallbackHandler
15
+ from langchain.memory import ConversationBufferMemory, StreamlitChatMessageHistory
16
+ from langchain.prompts import ChatPromptTemplate, MessagesPlaceholder
17
+ from langchain.schema.document import Document
18
+ from langchain.schema.retriever import BaseRetriever
19
+ from langchain.tools import DuckDuckGoSearchRun, WikipediaQueryRun
20
+ from langchain.utilities import WikipediaAPIWrapper
21
+ from langsmith.client import Client
22
+ from streamlit_feedback import streamlit_feedback
23
+
24
+ from defaults import default_values
25
+ from llm_resources import (
26
+ get_agent,
27
+ get_doc_agent,
28
+ get_llm,
29
+ get_runnable,
30
+ get_texts_and_multiretriever,
31
+ )
32
+ from python_coder import get_agent as get_python_agent
33
+ from research_assistant.chain import get_chain as get_research_assistant_chain
34
+
35
+ __version__ = "2.1.4"
36
+
37
+ # --- Initialization ---
38
+ st.set_page_config(
39
+ page_title=f"langchain-streamlit-demo v{__version__}",
40
+ page_icon="🦜",
41
+ )
42
+
43
+
44
def st_init_null(*variable_names) -> None:
    """Ensure every named key exists in Streamlit session state.

    Keys that are not yet present are created with a value of ``None``;
    keys that already exist are left untouched.
    """
    missing = (name for name in variable_names if name not in st.session_state)
    for name in missing:
        st.session_state[name] = None
48
+
49
+
50
+ st_init_null(
51
+ "chain",
52
+ "client",
53
+ "doc_chain",
54
+ "document_chat_chain_type",
55
+ "llm",
56
+ "ls_tracer",
57
+ "provider",
58
+ "retriever",
59
+ "run",
60
+ "run_id",
61
+ "trace_link",
62
+ "LANGSMITH_API_KEY",
63
+ "LANGSMITH_PROJECT",
64
+ "AZURE_OPENAI_BASE_URL",
65
+ "AZURE_OPENAI_API_VERSION",
66
+ "AZURE_OPENAI_DEPLOYMENT_NAME",
67
+ "AZURE_OPENAI_EMB_DEPLOYMENT_NAME",
68
+ "AZURE_OPENAI_API_KEY",
69
+ "AZURE_OPENAI_MODEL_VERSION",
70
+ "AZURE_AVAILABLE",
71
+ )
72
+
73
+ # --- LLM globals ---
74
+ STMEMORY = StreamlitChatMessageHistory(key="langchain_messages")
75
+ MEMORY = ConversationBufferMemory(
76
+ chat_memory=STMEMORY,
77
+ return_messages=True,
78
+ memory_key="chat_history",
79
+ )
80
+
81
+ RUN_COLLECTOR = RunCollectorCallbackHandler()
82
+
83
+ st.session_state.LANGSMITH_API_KEY = (
84
+ st.session_state.LANGSMITH_API_KEY
85
+ or default_values.PROVIDER_KEY_DICT.get("LANGSMITH")
86
+ )
87
+
88
+ st.session_state.LANGSMITH_PROJECT = st.session_state.LANGSMITH_PROJECT or (
89
+ default_values.DEFAULT_LANGSMITH_PROJECT or "langchain-streamlit-demo"
90
+ )
91
+
92
+
93
def azure_state_or_default(*args):
    """Backfill Azure-related session-state keys from environment defaults.

    For each key name given, keep the current (truthy) session-state value
    if one exists; otherwise fall back to the corresponding entry in
    ``default_values.AZURE_DICT`` (which may itself be ``None``).
    """
    for key in args:
        st.session_state[key] = (
            st.session_state.get(key) or default_values.AZURE_DICT.get(key)
        )
100
+
101
+
102
+ azure_state_or_default(
103
+ "AZURE_OPENAI_BASE_URL",
104
+ "AZURE_OPENAI_API_VERSION",
105
+ "AZURE_OPENAI_DEPLOYMENT_NAME",
106
+ "AZURE_OPENAI_EMB_DEPLOYMENT_NAME",
107
+ "AZURE_OPENAI_API_KEY",
108
+ "AZURE_OPENAI_MODEL_VERSION",
109
+ )
110
+
111
+ st.session_state.AZURE_AVAILABLE = all(
112
+ [
113
+ st.session_state.AZURE_OPENAI_BASE_URL,
114
+ st.session_state.AZURE_OPENAI_API_VERSION,
115
+ st.session_state.AZURE_OPENAI_DEPLOYMENT_NAME,
116
+ st.session_state.AZURE_OPENAI_API_KEY,
117
+ st.session_state.AZURE_OPENAI_MODEL_VERSION,
118
+ ],
119
+ )
120
+
121
+ st.session_state.AZURE_EMB_AVAILABLE = (
122
+ st.session_state.AZURE_AVAILABLE
123
+ and st.session_state.AZURE_OPENAI_EMB_DEPLOYMENT_NAME
124
+ )
125
+
126
+ AZURE_KWARGS = (
127
+ None
128
+ if not st.session_state.AZURE_EMB_AVAILABLE
129
+ else {
130
+ "openai_api_base": st.session_state.AZURE_OPENAI_BASE_URL,
131
+ "openai_api_version": st.session_state.AZURE_OPENAI_API_VERSION,
132
+ "deployment": st.session_state.AZURE_OPENAI_EMB_DEPLOYMENT_NAME,
133
+ "openai_api_key": st.session_state.AZURE_OPENAI_API_KEY,
134
+ "openai_api_type": "azure",
135
+ }
136
+ )
137
+
138
+
139
@st.cache_resource
def get_texts_and_retriever_cacheable_wrapper(
    uploaded_file_bytes: bytes,
    openai_api_key: str,
    chunk_size: int = default_values.DEFAULT_CHUNK_SIZE,
    chunk_overlap: int = default_values.DEFAULT_CHUNK_OVERLAP,
    k: int = default_values.DEFAULT_RETRIEVER_K,
    azure_kwargs: Optional[Dict[str, str]] = None,
    use_azure: bool = False,
) -> Tuple[List[Document], BaseRetriever]:
    """Cache-aware passthrough to ``get_texts_and_multiretriever``.

    Exists so Streamlit's ``st.cache_resource`` can memoize the expensive
    document-splitting and retriever construction on the hashable arguments
    (file bytes, API key, chunking parameters).

    Returns:
        A tuple of the split document chunks and the retriever built over them.
    """
    call_kwargs = dict(
        uploaded_file_bytes=uploaded_file_bytes,
        openai_api_key=openai_api_key,
        chunk_size=chunk_size,
        chunk_overlap=chunk_overlap,
        k=k,
        azure_kwargs=azure_kwargs,
        use_azure=use_azure,
    )
    return get_texts_and_multiretriever(**call_kwargs)
158
+
159
+
160
+ # --- Sidebar ---
161
+ sidebar = st.sidebar
162
+ with sidebar:
163
+ st.markdown("# Menu")
164
+
165
+ model = st.selectbox(
166
+ label="Chat Model",
167
+ options=default_values.SUPPORTED_MODELS,
168
+ index=default_values.SUPPORTED_MODELS.index(default_values.DEFAULT_MODEL),
169
+ )
170
+
171
+ st.session_state.provider = default_values.MODEL_DICT[model]
172
+
173
+ provider_api_key = (
174
+ default_values.PROVIDER_KEY_DICT.get(
175
+ st.session_state.provider,
176
+ )
177
+ or st.text_input(
178
+ f"{st.session_state.provider} API key",
179
+ type="password",
180
+ )
181
+ if st.session_state.provider != "Azure OpenAI"
182
+ else ""
183
+ )
184
+
185
+ if st.button("Clear message history"):
186
+ STMEMORY.clear()
187
+ st.session_state.trace_link = None
188
+ st.session_state.run_id = None
189
+
190
+ # --- Document Chat Options ---
191
+ with st.expander("Document Chat", expanded=False):
192
+ uploaded_file = st.file_uploader("Upload a PDF", type="pdf")
193
+
194
+ openai_api_key = (
195
+ provider_api_key
196
+ if st.session_state.provider == "OpenAI"
197
+ else default_values.OPENAI_API_KEY
198
+ or st.sidebar.text_input("OpenAI API Key: ", type="password")
199
+ )
200
+
201
+ document_chat = st.checkbox(
202
+ "Document Chat",
203
+ value=True if uploaded_file else False,
204
+ help="Uploaded document will provide context for the chat.",
205
+ )
206
+
207
+ k = st.slider(
208
+ label="Number of Chunks",
209
+ help="How many document chunks will be used for context?",
210
+ value=default_values.DEFAULT_RETRIEVER_K,
211
+ min_value=1,
212
+ max_value=10,
213
+ )
214
+
215
+ chunk_size = st.slider(
216
+ label="Number of Tokens per Chunk",
217
+ help="Size of each chunk of text",
218
+ min_value=default_values.MIN_CHUNK_SIZE,
219
+ max_value=default_values.MAX_CHUNK_SIZE,
220
+ value=default_values.DEFAULT_CHUNK_SIZE,
221
+ )
222
+
223
+ chunk_overlap = st.slider(
224
+ label="Chunk Overlap",
225
+ help="Number of characters to overlap between chunks",
226
+ min_value=default_values.MIN_CHUNK_OVERLAP,
227
+ max_value=default_values.MAX_CHUNK_OVERLAP,
228
+ value=default_values.DEFAULT_CHUNK_OVERLAP,
229
+ )
230
+
231
+ chain_type_help_root = (
232
+ "https://python.langchain.com/docs/modules/chains/document/"
233
+ )
234
+
235
+ chain_type_help = "\n".join(
236
+ f"- [{chain_type_name}]({chain_type_help_root}/{chain_type_name})"
237
+ for chain_type_name in (
238
+ "stuff",
239
+ "refine",
240
+ "map_reduce",
241
+ "map_rerank",
242
+ )
243
+ )
244
+
245
+ document_chat_chain_type = st.selectbox(
246
+ label="Document Chat Chain Type",
247
+ options=[
248
+ "stuff",
249
+ "refine",
250
+ "map_reduce",
251
+ "map_rerank",
252
+ "Q&A Generation",
253
+ "Summarization",
254
+ ],
255
+ index=0,
256
+ help=chain_type_help,
257
+ )
258
+ use_azure = st.toggle(
259
+ label="Use Azure OpenAI",
260
+ value=st.session_state.AZURE_EMB_AVAILABLE,
261
+ help="Use Azure for embeddings instead of using OpenAI directly.",
262
+ )
263
+
264
+ if uploaded_file:
265
+ if st.session_state.AZURE_EMB_AVAILABLE or openai_api_key:
266
+ (
267
+ st.session_state.texts,
268
+ st.session_state.retriever,
269
+ ) = get_texts_and_retriever_cacheable_wrapper(
270
+ uploaded_file_bytes=uploaded_file.getvalue(),
271
+ openai_api_key=openai_api_key,
272
+ chunk_size=chunk_size,
273
+ chunk_overlap=chunk_overlap,
274
+ k=k,
275
+ azure_kwargs=AZURE_KWARGS,
276
+ use_azure=use_azure,
277
+ )
278
+ else:
279
+ st.error("Please enter a valid OpenAI API key.", icon="❌")
280
+
281
+ # --- Advanced Settings ---
282
+ with st.expander("Advanced Settings", expanded=False):
283
+ st.markdown("## Feedback Scale")
284
+ use_faces = st.toggle(label="`Thumbs` ⇄ `Faces`", value=False)
285
+ feedback_option = "faces" if use_faces else "thumbs"
286
+
287
+ system_prompt = (
288
+ st.text_area(
289
+ "Custom Instructions",
290
+ default_values.DEFAULT_SYSTEM_PROMPT,
291
+ help="Custom instructions to provide the language model to determine style, personality, etc.",
292
+ )
293
+ .strip()
294
+ .replace("{", "{{")
295
+ .replace("}", "}}")
296
+ )
297
+
298
+ temperature = st.slider(
299
+ "Temperature",
300
+ min_value=default_values.MIN_TEMP,
301
+ max_value=default_values.MAX_TEMP,
302
+ value=default_values.DEFAULT_TEMP,
303
+ help="Higher values give more random results.",
304
+ )
305
+
306
+ max_tokens = st.slider(
307
+ "Max Tokens",
308
+ min_value=default_values.MIN_MAX_TOKENS,
309
+ max_value=default_values.MAX_MAX_TOKENS,
310
+ value=default_values.DEFAULT_MAX_TOKENS,
311
+ help="Higher values give longer results.",
312
+ )
313
+
314
+ # --- LangSmith Options ---
315
+ if default_values.SHOW_LANGSMITH_OPTIONS:
316
+ with st.expander("LangSmith Options", expanded=False):
317
+ st.session_state.LANGSMITH_API_KEY = st.text_input(
318
+ "LangSmith API Key (optional)",
319
+ value=st.session_state.LANGSMITH_API_KEY,
320
+ type="password",
321
+ )
322
+
323
+ st.session_state.LANGSMITH_PROJECT = st.text_input(
324
+ "LangSmith Project Name",
325
+ value=st.session_state.LANGSMITH_PROJECT,
326
+ )
327
+
328
+ if st.session_state.client is None and st.session_state.LANGSMITH_API_KEY:
329
+ st.session_state.client = Client(
330
+ api_url="https://api.smith.langchain.com",
331
+ api_key=st.session_state.LANGSMITH_API_KEY,
332
+ )
333
+ st.session_state.ls_tracer = LangChainTracer(
334
+ project_name=st.session_state.LANGSMITH_PROJECT,
335
+ client=st.session_state.client,
336
+ )
337
+
338
+ # --- Azure Options ---
339
+ if default_values.SHOW_AZURE_OPTIONS:
340
+ with st.expander("Azure Options", expanded=False):
341
+ st.session_state.AZURE_OPENAI_BASE_URL = st.text_input(
342
+ "AZURE_OPENAI_BASE_URL",
343
+ value=st.session_state.AZURE_OPENAI_BASE_URL,
344
+ )
345
+
346
+ st.session_state.AZURE_OPENAI_API_VERSION = st.text_input(
347
+ "AZURE_OPENAI_API_VERSION",
348
+ value=st.session_state.AZURE_OPENAI_API_VERSION,
349
+ )
350
+
351
+ st.session_state.AZURE_OPENAI_DEPLOYMENT_NAME = st.text_input(
352
+ "AZURE_OPENAI_DEPLOYMENT_NAME",
353
+ value=st.session_state.AZURE_OPENAI_DEPLOYMENT_NAME,
354
+ )
355
+
356
+ st.session_state.AZURE_OPENAI_EMB_DEPLOYMENT_NAME = st.text_input(
357
+ "AZURE_OPENAI_EMB_DEPLOYMENT_NAME",
358
+ value=st.session_state.AZURE_OPENAI_EMB_DEPLOYMENT_NAME,
359
+ )
360
+
361
+ st.session_state.AZURE_OPENAI_API_KEY = st.text_input(
362
+ "AZURE_OPENAI_API_KEY",
363
+ value=st.session_state.AZURE_OPENAI_API_KEY,
364
+ type="password",
365
+ )
366
+
367
+ st.session_state.AZURE_OPENAI_MODEL_VERSION = st.text_input(
368
+ "AZURE_OPENAI_MODEL_VERSION",
369
+ value=st.session_state.AZURE_OPENAI_MODEL_VERSION,
370
+ )
371
+
372
+
373
+ # --- LLM Instantiation ---
374
+ get_llm_args = dict(
375
+ provider=st.session_state.provider,
376
+ model=model,
377
+ provider_api_key=provider_api_key,
378
+ temperature=temperature,
379
+ max_tokens=max_tokens,
380
+ azure_available=st.session_state.AZURE_AVAILABLE,
381
+ azure_dict={
382
+ "AZURE_OPENAI_BASE_URL": st.session_state.AZURE_OPENAI_BASE_URL,
383
+ "AZURE_OPENAI_API_VERSION": st.session_state.AZURE_OPENAI_API_VERSION,
384
+ "AZURE_OPENAI_DEPLOYMENT_NAME": st.session_state.AZURE_OPENAI_DEPLOYMENT_NAME,
385
+ "AZURE_OPENAI_API_KEY": st.session_state.AZURE_OPENAI_API_KEY,
386
+ "AZURE_OPENAI_MODEL_VERSION": st.session_state.AZURE_OPENAI_MODEL_VERSION,
387
+ },
388
+ )
389
+ get_llm_args_temp_zero = get_llm_args | {"temperature": 0.0}
390
+ st.session_state.llm = get_llm(**get_llm_args)
391
+
392
+ # --- Chat History ---
393
+ for msg in STMEMORY.messages:
394
+ if msg.content and msg.type in ("ai", "assistant", "human", "user"):
395
+ st.chat_message(
396
+ msg.type,
397
+ avatar="🦜" if msg.type in ("ai", "assistant") else None,
398
+ ).write(msg.content)
399
+
400
+
401
+ # --- Current Chat ---
402
+ if st.session_state.llm:
403
+ # --- Regular Chat ---
404
+ chat_prompt = ChatPromptTemplate.from_messages(
405
+ [
406
+ (
407
+ "system",
408
+ system_prompt + "\nIt's currently {time}.",
409
+ ),
410
+ MessagesPlaceholder(variable_name="chat_history"),
411
+ ("human", "{query}"),
412
+ ],
413
+ ).partial(time=lambda: str(datetime.now()))
414
+
415
+ # --- Chat Input ---
416
+ prompt = st.chat_input(placeholder="Ask me a question!")
417
+ if prompt:
418
+ st.chat_message("user").write(prompt)
419
+ feedback_update = None
420
+ feedback = None
421
+
422
+ # --- Chat Output ---
423
+ with st.chat_message("assistant", avatar="🦜"):
424
+ callbacks = [RUN_COLLECTOR]
425
+
426
+ if st.session_state.ls_tracer:
427
+ callbacks.append(st.session_state.ls_tracer)
428
+
429
+ def get_config(callbacks: list[BaseCallbackHandler]) -> dict[str, Any]:
430
+ config: Dict[str, Any] = dict(
431
+ callbacks=callbacks,
432
+ tags=["Streamlit Chat"],
433
+ verbose=True,
434
+ return_intermediate_steps=False,
435
+ )
436
+ if st.session_state.provider == "Anthropic":
437
+ config["max_concurrency"] = 5
438
+ return config
439
+
440
+ use_document_chat = all(
441
+ [
442
+ document_chat,
443
+ st.session_state.retriever,
444
+ ],
445
+ )
446
+
447
+ full_response: Union[str, None] = None
448
+ # stream_handler = StreamHandler(message_placeholder)
449
+ # callbacks.append(stream_handler)
450
+ message_placeholder = st.empty()
451
+ default_tools = [
452
+ DuckDuckGoSearchRun(),
453
+ WikipediaQueryRun(api_wrapper=WikipediaAPIWrapper()),
454
+ ]
455
+ default_tools += load_tools(["requests_get"])
456
+ default_tools += load_tools(["llm-math"], llm=st.session_state.llm)
457
+ if st.session_state.provider in ("Azure OpenAI", "OpenAI"):
458
+ research_assistant_chain = get_research_assistant_chain(
459
+ search_llm=get_llm(**get_llm_args_temp_zero), # type: ignore
460
+ writer_llm=get_llm(**get_llm_args_temp_zero), # type: ignore
461
+ )
462
+ st_callback = StreamlitCallbackHandler(st.container())
463
+ callbacks.append(st_callback)
464
+
465
+ @tool("web-research-assistant")
466
+ def research_assistant_tool(question: str, callbacks: Callbacks = None):
467
+ """This assistant returns a comprehensive report based on web research.
468
+ It's slow and relatively expensive, so use it sparingly.
469
+ Consider using a different tool for quick facts or web queries.
470
+ """
471
+ return research_assistant_chain.invoke(
472
+ dict(question=question),
473
+ config=get_config(callbacks),
474
+ )
475
+
476
+ python_coder_agent = get_python_agent(st.session_state.llm)
477
+
478
+ @tool("python-coder-assistant")
479
+ def python_coder_tool(input_str: str, callbacks: Callbacks = None):
480
+ """This assistant writes PYTHON code.
481
+ Give it clear instructions and requirements.
482
+ Do not use it for tasks other than Python.
483
+ """
484
+ return python_coder_agent.invoke(
485
+ dict(input=input_str),
486
+ config=get_config(callbacks),
487
+ )
488
+
489
+ TOOLS = [research_assistant_tool, python_coder_tool] + default_tools
490
+
491
+ if use_document_chat:
492
+ st.session_state.doc_chain = get_runnable(
493
+ use_document_chat,
494
+ document_chat_chain_type,
495
+ st.session_state.llm,
496
+ st.session_state.retriever,
497
+ MEMORY,
498
+ chat_prompt,
499
+ prompt,
500
+ )
501
+
502
+ @tool("user-document-chat")
503
+ def doc_chain_tool(input_str: str, callbacks: Callbacks = None):
504
+ """Always use this tool at least once. Input should be a question."""
505
+ return st.session_state.doc_chain.invoke(
506
+ input_str,
507
+ config=get_config(callbacks),
508
+ )
509
+
510
+ doc_chain_agent = get_doc_agent(
511
+ [doc_chain_tool],
512
+ )
513
+
514
+ @tool("document-question-tool")
515
+ def doc_question_tool(input_str: str, callbacks: Callbacks = None):
516
+ """This tool is an AI assistant with access to the user's uploaded document.
517
+ Input should be one or more questions, requests, instructions, etc.
518
+ If the user's meaning is unclear, perhaps the answer is here.
519
+ Generally speaking, try this tool before conducting web research.
520
+ """
521
+ return doc_chain_agent.invoke(
522
+ input_str,
523
+ config=get_config(callbacks),
524
+ )
525
+
526
+ TOOLS = [doc_question_tool] + TOOLS
527
+
528
+ st.session_state.chain = get_agent(
529
+ TOOLS,
530
+ STMEMORY,
531
+ st.session_state.llm,
532
+ callbacks,
533
+ )
534
+ else:
535
+ st.session_state.chain = get_runnable(
536
+ use_document_chat,
537
+ document_chat_chain_type,
538
+ st.session_state.llm,
539
+ st.session_state.retriever,
540
+ MEMORY,
541
+ chat_prompt,
542
+ prompt,
543
+ )
544
+
545
+ # --- LLM call ---
546
+ try:
547
+ full_response = st.session_state.chain.invoke(
548
+ prompt,
549
+ config=get_config(callbacks),
550
+ )
551
+
552
+ except (openai.AuthenticationError, anthropic.AuthenticationError):
553
+ st.error(
554
+ f"Please enter a valid {st.session_state.provider} API key.",
555
+ icon="❌",
556
+ )
557
+
558
+ # --- Display output ---
559
+ if full_response is not None:
560
+ message_placeholder.markdown(full_response)
561
+
562
+ # --- Tracing ---
563
+ if st.session_state.client:
564
+ st.session_state.run = RUN_COLLECTOR.traced_runs[0]
565
+ st.session_state.run_id = st.session_state.run.id
566
+ RUN_COLLECTOR.traced_runs = []
567
+ wait_for_all_tracers()
568
+ try:
569
+ st.session_state.trace_link = st.session_state.client.read_run(
570
+ st.session_state.run_id,
571
+ ).url
572
+ except (
573
+ langsmith.utils.LangSmithError,
574
+ langsmith.utils.LangSmithNotFoundError,
575
+ ):
576
+ st.session_state.trace_link = None
577
+
578
+ # --- LangSmith Trace Link ---
579
+ if st.session_state.trace_link:
580
+ with sidebar:
581
+ st.markdown(
582
+ f'<a href="{st.session_state.trace_link}" target="_blank"><button>Latest Trace: 🛠️</button></a>',
583
+ unsafe_allow_html=True,
584
+ )
585
+
586
+ # --- Feedback ---
587
+ if st.session_state.client and st.session_state.run_id:
588
+ feedback = streamlit_feedback(
589
+ feedback_type=feedback_option,
590
+ optional_text_label="[Optional] Please provide an explanation",
591
+ key=f"feedback_{st.session_state.run_id}",
592
+ )
593
+
594
+ # Define score mappings for both "thumbs" and "faces" feedback systems
595
+ score_mappings: dict[str, dict[str, Union[int, float]]] = {
596
+ "thumbs": {"👍": 1, "👎": 0},
597
+ "faces": {"😀": 1, "🙂": 0.75, "😐": 0.5, "🙁": 0.25, "😞": 0},
598
+ }
599
+
600
+ # Get the score mapping based on the selected feedback option
601
+ scores = score_mappings[feedback_option]
602
+
603
+ if feedback:
604
+ # Get the score from the selected feedback option's score mapping
605
+ score = scores.get(
606
+ feedback["score"],
607
+ )
608
+
609
+ if score is not None:
610
+ # Formulate feedback type string incorporating the feedback option
611
+ # and score value
612
+ feedback_type_str = f"{feedback_option} {feedback['score']}"
613
+
614
+ # Record the feedback with the formulated feedback type string
615
+ # and optional comment
616
+ feedback_record = st.session_state.client.create_feedback(
617
+ st.session_state.run_id,
618
+ feedback_type_str,
619
+ score=score,
620
+ comment=feedback.get("text"),
621
+ )
622
+ st.toast("Feedback recorded!", icon="📝")
623
+ else:
624
+ st.warning("Invalid feedback score.")
625
+
626
+ else:
627
+ st.error(f"Please enter a valid {st.session_state.provider} API key.", icon="❌")
langchain-streamlit-demo/defaults.py ADDED
@@ -0,0 +1,134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ from collections import namedtuple
3
+
4
+
5
# Supported models grouped by the provider that serves them; insertion
# order here determines the order shown in the UI model selector.
_MODELS_BY_PROVIDER = {
    "OpenAI": [
        "gpt-3.5-turbo",
        "gpt-4",
        "gpt-4-1106-preview",
    ],
    "Anthropic": [
        "claude-instant-1",
        "claude-instant-1.2",
        "claude-2",
        "claude-2.1",
    ],
    "Anyscale Endpoints": [
        "meta-llama/Llama-2-7b-chat-hf",
        "meta-llama/Llama-2-13b-chat-hf",
        "meta-llama/Llama-2-70b-chat-hf",
        "codellama/CodeLlama-34b-Instruct-hf",
        "mistralai/Mistral-7B-Instruct-v0.1",
        "HuggingFaceH4/zephyr-7b-beta",
    ],
    # The Azure entry is a placeholder: the concrete deployment is picked
    # via the AZURE_* settings below.
    "Azure OpenAI": ["Azure OpenAI"],
}

# Flat model-name -> provider lookup (same insertion order as above).
MODEL_DICT = {
    model: provider
    for provider, models in _MODELS_BY_PROVIDER.items()
    for model in models
}

SUPPORTED_MODELS = list(MODEL_DICT)

DEFAULT_MODEL = os.environ.get("DEFAULT_MODEL", "gpt-3.5-turbo")

DEFAULT_SYSTEM_PROMPT = os.environ.get(
    "DEFAULT_SYSTEM_PROMPT",
    "You are a helpful chatbot. Do not rush. Always plan, think, and act in a step-by-step manner.",
)


def _env_float(name: str, fallback: float) -> float:
    """Read a float setting from the environment, with a default."""
    return float(os.environ.get(name, fallback))


def _env_int(name: str, fallback: int) -> int:
    """Read an int setting from the environment, with a default."""
    return int(os.environ.get(name, fallback))


def _env_flag(name: str) -> bool:
    """Read a boolean flag from the environment; defaults to true."""
    return os.environ.get(name, "true").lower() == "true"


# Temperature slider bounds and default.
MIN_TEMP = _env_float("MIN_TEMPERATURE", 0.0)
MAX_TEMP = _env_float("MAX_TEMPERATURE", 1.0)
DEFAULT_TEMP = _env_float("DEFAULT_TEMPERATURE", 0.7)

# Max-tokens slider bounds and default.
MIN_MAX_TOKENS = _env_int("MIN_MAX_TOKENS", 1)
MAX_MAX_TOKENS = _env_int("MAX_MAX_TOKENS", 100000)
DEFAULT_MAX_TOKENS = _env_int("DEFAULT_MAX_TOKENS", 1000)

DEFAULT_LANGSMITH_PROJECT = os.environ.get("LANGCHAIN_PROJECT")

# Environment variables that together configure Azure OpenAI.
AZURE_VARS = [
    "AZURE_OPENAI_BASE_URL",
    "AZURE_OPENAI_API_VERSION",
    "AZURE_OPENAI_DEPLOYMENT_NAME",
    "AZURE_OPENAI_EMB_DEPLOYMENT_NAME",
    "AZURE_OPENAI_API_KEY",
    "AZURE_OPENAI_MODEL_VERSION",
]

AZURE_DICT = {name: os.environ.get(name, "") for name in AZURE_VARS}


SHOW_LANGSMITH_OPTIONS = _env_flag("SHOW_LANGSMITH_OPTIONS")
SHOW_AZURE_OPTIONS = _env_flag("SHOW_AZURE_OPTIONS")

# Provider name -> API key (empty string when unset).
PROVIDER_KEY_DICT = {
    "OpenAI": os.environ.get("OPENAI_API_KEY", ""),
    "Anthropic": os.environ.get("ANTHROPIC_API_KEY", ""),
    "Anyscale Endpoints": os.environ.get("ANYSCALE_API_KEY", ""),
    "LANGSMITH": os.environ.get("LANGCHAIN_API_KEY", ""),
}

OPENAI_API_KEY = PROVIDER_KEY_DICT["OpenAI"]


# Document-splitting controls for the uploaded-file retriever.
MIN_CHUNK_SIZE = 1
MAX_CHUNK_SIZE = 10000
DEFAULT_CHUNK_SIZE = 1000

MIN_CHUNK_OVERLAP = 0
MAX_CHUNK_OVERLAP = 10000
DEFAULT_CHUNK_OVERLAP = 0

DEFAULT_RETRIEVER_K = 4

# Immutable bundle of all defaults, handed to the app in one object.
DEFAULT_VALUES = namedtuple(
    "DEFAULT_VALUES",
    [
        "MODEL_DICT",
        "SUPPORTED_MODELS",
        "DEFAULT_MODEL",
        "DEFAULT_SYSTEM_PROMPT",
        "MIN_TEMP",
        "MAX_TEMP",
        "DEFAULT_TEMP",
        "MIN_MAX_TOKENS",
        "MAX_MAX_TOKENS",
        "DEFAULT_MAX_TOKENS",
        "DEFAULT_LANGSMITH_PROJECT",
        "AZURE_VARS",
        "AZURE_DICT",
        "PROVIDER_KEY_DICT",
        "OPENAI_API_KEY",
        "MIN_CHUNK_SIZE",
        "MAX_CHUNK_SIZE",
        "DEFAULT_CHUNK_SIZE",
        "MIN_CHUNK_OVERLAP",
        "MAX_CHUNK_OVERLAP",
        "DEFAULT_CHUNK_OVERLAP",
        "DEFAULT_RETRIEVER_K",
        "SHOW_LANGSMITH_OPTIONS",
        "SHOW_AZURE_OPTIONS",
    ],
)


# Keyword construction keeps each value visibly paired with its field.
default_values = DEFAULT_VALUES(
    MODEL_DICT=MODEL_DICT,
    SUPPORTED_MODELS=SUPPORTED_MODELS,
    DEFAULT_MODEL=DEFAULT_MODEL,
    DEFAULT_SYSTEM_PROMPT=DEFAULT_SYSTEM_PROMPT,
    MIN_TEMP=MIN_TEMP,
    MAX_TEMP=MAX_TEMP,
    DEFAULT_TEMP=DEFAULT_TEMP,
    MIN_MAX_TOKENS=MIN_MAX_TOKENS,
    MAX_MAX_TOKENS=MAX_MAX_TOKENS,
    DEFAULT_MAX_TOKENS=DEFAULT_MAX_TOKENS,
    DEFAULT_LANGSMITH_PROJECT=DEFAULT_LANGSMITH_PROJECT,
    AZURE_VARS=AZURE_VARS,
    AZURE_DICT=AZURE_DICT,
    PROVIDER_KEY_DICT=PROVIDER_KEY_DICT,
    OPENAI_API_KEY=OPENAI_API_KEY,
    MIN_CHUNK_SIZE=MIN_CHUNK_SIZE,
    MAX_CHUNK_SIZE=MAX_CHUNK_SIZE,
    DEFAULT_CHUNK_SIZE=DEFAULT_CHUNK_SIZE,
    MIN_CHUNK_OVERLAP=MIN_CHUNK_OVERLAP,
    MAX_CHUNK_OVERLAP=MAX_CHUNK_OVERLAP,
    DEFAULT_CHUNK_OVERLAP=DEFAULT_CHUNK_OVERLAP,
    DEFAULT_RETRIEVER_K=DEFAULT_RETRIEVER_K,
    SHOW_LANGSMITH_OPTIONS=SHOW_LANGSMITH_OPTIONS,
    SHOW_AZURE_OPTIONS=SHOW_AZURE_OPTIONS,
)
langchain-streamlit-demo/llm_resources.py ADDED
@@ -0,0 +1,294 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import uuid
2
+ from tempfile import NamedTemporaryFile
3
+ from typing import Tuple, List, Optional, Dict
4
+
5
+ from langchain.agents import AgentExecutor, AgentType, initialize_agent
6
+ from langchain.agents.openai_functions_agent.base import OpenAIFunctionsAgent
7
+ from langchain.callbacks.base import BaseCallbackHandler
8
+ from langchain.chains import LLMChain
9
+ from langchain.chains import RetrievalQA
10
+ from langchain.chat_models import (
11
+ AzureChatOpenAI,
12
+ ChatOpenAI,
13
+ ChatAnthropic,
14
+ ChatAnyscale,
15
+ )
16
+ from langchain.document_loaders import PyPDFLoader
17
+ from langchain.embeddings import AzureOpenAIEmbeddings, OpenAIEmbeddings
18
+ from langchain.llms.base import BaseLLM
19
+ from langchain.memory import ConversationBufferMemory
20
+ from langchain.prompts import MessagesPlaceholder, ChatPromptTemplate
21
+ from langchain.retrievers import EnsembleRetriever
22
+ from langchain.retrievers.multi_query import MultiQueryRetriever
23
+ from langchain.retrievers.multi_vector import MultiVectorRetriever
24
+ from langchain.schema import Document, BaseRetriever
25
+ from langchain.schema.chat_history import BaseChatMessageHistory
26
+ from langchain.schema.runnable import RunnablePassthrough
27
+ from langchain.storage import InMemoryStore
28
+ from langchain.text_splitter import RecursiveCharacterTextSplitter
29
+ from langchain.tools.base import BaseTool
30
+ from langchain.vectorstores import FAISS
31
+ from langchain_core.messages import SystemMessage
32
+
33
+ from defaults import DEFAULT_CHUNK_SIZE, DEFAULT_CHUNK_OVERLAP, DEFAULT_RETRIEVER_K
34
+ from qagen import get_rag_qa_gen_chain
35
+ from summarize import get_rag_summarization_chain
36
+
37
+
38
+ def get_agent(
39
+ tools: list[BaseTool],
40
+ chat_history: BaseChatMessageHistory,
41
+ llm: BaseLLM,
42
+ callbacks,
43
+ ):
44
+ memory_key = "agent_history"
45
+ system_message = SystemMessage(
46
+ content=(
47
+ "Do your best to answer the questions. "
48
+ "Feel free to use any tools available to look up "
49
+ "relevant information, only if necessary"
50
+ ),
51
+ )
52
+ prompt = OpenAIFunctionsAgent.create_prompt(
53
+ system_message=system_message,
54
+ extra_prompt_messages=[MessagesPlaceholder(variable_name=memory_key)],
55
+ )
56
+ agent = OpenAIFunctionsAgent(llm=llm, tools=tools, prompt=prompt)
57
+
58
+ # agent_memory = AgentTokenBufferMemory(
59
+ # chat_memory=chat_history,
60
+ # memory_key=memory_key,
61
+ # llm=llm,
62
+ # )
63
+
64
+ agent_memory = ConversationBufferMemory(
65
+ chat_memory=chat_history,
66
+ return_messages=True,
67
+ memory_key=memory_key,
68
+ )
69
+
70
+ agent_executor = AgentExecutor(
71
+ agent=agent,
72
+ tools=tools,
73
+ memory=agent_memory,
74
+ verbose=True,
75
+ return_intermediate_steps=False,
76
+ callbacks=callbacks,
77
+ )
78
+ return (
79
+ {"input": RunnablePassthrough()}
80
+ | agent_executor
81
+ | (lambda output: output["output"])
82
+ )
83
+
84
+
85
def get_doc_agent(
    tools: list[BaseTool],
    llm: Optional[BaseLLM] = None,
    agent_type: AgentType = AgentType.CHAT_ZERO_SHOT_REACT_DESCRIPTION,
):
    """Build a document-question agent as a string-in/string-out runnable.

    Args:
        tools: Document-specific tools (e.g. retrieval QA) the agent can use.
        llm: Chat model for the agent; defaults to a zero-temperature
            streaming GPT-4 Turbo instance when omitted.
        agent_type: LangChain agent flavor to instantiate.

    Returns:
        A runnable taking a plain string question and returning the
        agent's final string answer.
    """
    if llm is None:
        # Default reads the OpenAI key from the environment (no key arg here).
        llm = ChatOpenAI(
            model_name="gpt-4-1106-preview",
            temperature=0.0,
            streaming=True,
        )
    prompt = ChatPromptTemplate.from_messages(
        [
            (
                "system",
                """
            You assist a chatbot with answering questions about a document.
            If necessary, break up incoming questions into multiple parts,
            and use the tools provided to answer smaller questions before
            answering the larger question.
            """,
            ),
            ("user", "{input}"),
            MessagesPlaceholder(variable_name="agent_scratchpad"),
        ],
    )
    # NOTE(review): initialize_agent forwards extra kwargs to the
    # AgentExecutor, not to the agent itself -- it is unclear from this
    # file whether `prompt=` actually reaches the agent; confirm.
    agent_executor = initialize_agent(
        tools,
        llm,
        agent=agent_type,
        verbose=True,
        memory=None,  # stateless: each call stands alone
        handle_parsing_errors=True,
        prompt=prompt,
    )
    # Adapt the executor's dict interface to plain strings.
    return (
        {"input": RunnablePassthrough()}
        | agent_executor
        | (lambda output: output["output"])
    )
125
+
126
+
127
def get_runnable(
    use_document_chat: bool,
    document_chat_chain_type: str,
    llm,
    retriever,
    memory,
    chat_prompt,
    summarization_prompt,
):
    """Assemble the runnable backing the chat session.

    Plain chat wraps an LLMChain over ``chat_prompt``; document chat
    dispatches on ``document_chat_chain_type`` to a Q&A-generation chain,
    a summarization chain, or a generic RetrievalQA chain.
    """
    if not use_document_chat:
        chat_chain = LLMChain(
            prompt=chat_prompt,
            llm=llm,
            memory=memory,
        )
        return chat_chain | (lambda result: result["text"])

    if document_chat_chain_type == "Q&A Generation":
        return get_rag_qa_gen_chain(retriever, llm)

    if document_chat_chain_type == "Summarization":
        return get_rag_summarization_chain(summarization_prompt, retriever, llm)

    # Any other chain type ("stuff", "refine", ...) goes through RetrievalQA.
    retrieval_qa = RetrievalQA.from_chain_type(
        llm=llm,
        chain_type=document_chat_chain_type,
        retriever=retriever,
        output_key="output_text",
    )
    return retrieval_qa | (lambda result: result["output_text"])
161
+
162
+
163
def get_llm(
    provider: str,
    model: str,
    provider_api_key: str,
    temperature: float,
    max_tokens: int,
    azure_available: bool,
    azure_dict: dict[str, str],
):
    """Instantiate a streaming chat model for the selected provider.

    Azure takes precedence when it is configured and selected; the other
    providers require a non-empty API key. Returns None when no model can
    be constructed.
    """
    if azure_available and provider == "Azure OpenAI":
        return AzureChatOpenAI(
            azure_endpoint=azure_dict["AZURE_OPENAI_BASE_URL"],
            openai_api_version=azure_dict["AZURE_OPENAI_API_VERSION"],
            deployment_name=azure_dict["AZURE_OPENAI_DEPLOYMENT_NAME"],
            openai_api_key=azure_dict["AZURE_OPENAI_API_KEY"],
            openai_api_type="azure",
            model_version=azure_dict["AZURE_OPENAI_MODEL_VERSION"],
            temperature=temperature,
            streaming=True,
            max_tokens=max_tokens,
        )

    # All remaining providers need a key; bail out early without one.
    if not provider_api_key:
        return None

    if provider == "OpenAI":
        return ChatOpenAI(
            model_name=model,
            openai_api_key=provider_api_key,
            temperature=temperature,
            streaming=True,
            max_tokens=max_tokens,
        )

    if provider == "Anthropic":
        return ChatAnthropic(
            model=model,
            anthropic_api_key=provider_api_key,
            temperature=temperature,
            streaming=True,
            max_tokens_to_sample=max_tokens,
        )

    if provider == "Anyscale Endpoints":
        return ChatAnyscale(
            model_name=model,
            anyscale_api_key=provider_api_key,
            temperature=temperature,
            streaming=True,
            max_tokens=max_tokens,
        )

    # Unknown provider.
    return None
214
+
215
+
216
def get_texts_and_multiretriever(
    uploaded_file_bytes: bytes,
    openai_api_key: str,
    chunk_size: int = DEFAULT_CHUNK_SIZE,
    chunk_overlap: int = DEFAULT_CHUNK_OVERLAP,
    k: int = DEFAULT_RETRIEVER_K,
    azure_kwargs: Optional[Dict[str, str]] = None,
    use_azure: bool = False,
) -> Tuple[List[Document], BaseRetriever]:
    """Index an uploaded PDF and build an ensemble retriever over it.

    Args:
        uploaded_file_bytes: Raw PDF bytes from the upload widget.
        openai_api_key: Key used for both embeddings and the
            query-rephrasing LLM.
        chunk_size: Chunk size for the MultiQuery index.
        chunk_overlap: Chunk overlap for the MultiQuery index.
        k: Number of documents the MultiQuery retriever returns.
        azure_kwargs: Azure embedding settings (expects an
            "openai_api_base" entry); not mutated.
        use_azure: Use AzureOpenAIEmbeddings instead of OpenAIEmbeddings.

    Returns:
        (split documents, ensemble retriever combining MultiQuery and
        MultiVector retrieval with equal weights).
    """
    with NamedTemporaryFile() as temp_file:
        temp_file.write(uploaded_file_bytes)
        temp_file.seek(0)

        loader = PyPDFLoader(temp_file.name)
        documents = loader.load()
        # Parent chunks are deliberately large; the child splitter below
        # produces the small chunks that are actually embedded.
        text_splitter = RecursiveCharacterTextSplitter(
            chunk_size=10000,
            chunk_overlap=0,
        )
        child_text_splitter = RecursiveCharacterTextSplitter(chunk_size=400)

        texts = text_splitter.split_documents(documents)
        id_key = "doc_id"

        # Tag each child chunk with its parent's id so the
        # MultiVectorRetriever can map hits back to full parent chunks.
        text_ids = [str(uuid.uuid4()) for _ in texts]
        sub_texts = []
        for i, text in enumerate(texts):
            _id = text_ids[i]
            _sub_texts = child_text_splitter.split_documents([text])
            for _text in _sub_texts:
                _text.metadata[id_key] = _id
            sub_texts.extend(_sub_texts)

        embeddings_kwargs = {"openai_api_key": openai_api_key}
        if use_azure and azure_kwargs:
            # BUGFIX: copy before popping so the caller's dict (often a
            # long-lived session/config mapping) is not mutated.
            azure_kwargs = dict(azure_kwargs)
            azure_kwargs["azure_endpoint"] = azure_kwargs.pop("openai_api_base")
            embeddings_kwargs.update(azure_kwargs)
            embeddings = AzureOpenAIEmbeddings(**embeddings_kwargs)
        else:
            embeddings = OpenAIEmbeddings(**embeddings_kwargs)
        store = InMemoryStore()

        # MultiVectorRetriever: search small child chunks, return parents.
        multivectorstore = FAISS.from_documents(sub_texts, embeddings)
        multivector_retriever = MultiVectorRetriever(
            vectorstore=multivectorstore,
            docstore=store,
            id_key=id_key,
        )
        multivector_retriever.docstore.mset(list(zip(text_ids, texts)))

        multiquery_text_splitter = RecursiveCharacterTextSplitter(
            chunk_size=chunk_size,
            chunk_overlap=chunk_overlap,
        )
        # MultiQueryRetriever: an LLM rephrases the query several ways.
        multiquery_texts = multiquery_text_splitter.split_documents(documents)
        multiquerystore = FAISS.from_documents(multiquery_texts, embeddings)
        multiquery_retriever = MultiQueryRetriever.from_llm(
            retriever=multiquerystore.as_retriever(search_kwargs={"k": k}),
            # BUGFIX: pass the caller's key explicitly instead of relying
            # on the OPENAI_API_KEY environment variable being set.
            llm=ChatOpenAI(openai_api_key=openai_api_key),
        )

        ensemble_retriever = EnsembleRetriever(
            retrievers=[multiquery_retriever, multivector_retriever],
            weights=[0.5, 0.5],
        )
        return multiquery_texts, ensemble_retriever
285
+
286
+
287
class StreamHandler(BaseCallbackHandler):
    """Streams LLM tokens into a Streamlit container as they arrive."""

    def __init__(self, container, initial_text=""):
        """Remember the target container and seed the accumulated text."""
        self.container = container
        self.text = initial_text

    def on_llm_new_token(self, token: str, **kwargs) -> None:
        """Append the new token and re-render the full text so far."""
        self.text = f"{self.text}{token}"
        self.container.markdown(self.text)
langchain-streamlit-demo/python_coder.py ADDED
@@ -0,0 +1,193 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """langchain python coder-- requires black, ruff, and mypy."""
2
+
3
import os
import re
import shlex
import subprocess  # nosec
import tempfile

from langchain.agents import initialize_agent, AgentType
from langchain.agents.tools import Tool
from langchain.llms.base import BaseLLM
from langchain.memory import ConversationBufferMemory
from langchain.prompts import ChatPromptTemplate
from langchain.prompts import MessagesPlaceholder
from langchain.pydantic_v1 import BaseModel, validator, Field, ValidationError
15
+
16
+
17
def strip_python_markdown_tags(text: str) -> str:
    """Extract the code from a ```python fenced block in *text*.

    Returns the fence's contents when one is found anywhere in the text
    (the original used ``match``, which only recognized a fence at the
    very start); otherwise returns *text* unchanged.
    """
    pat = re.compile(r"```python\n(.*)```", re.DOTALL)
    code = pat.search(text)  # search, not match: the fence may follow prose
    return code.group(1) if code else text
24
+
25
+
26
def format_black(filepath: str):
    """Format a file in place with black.

    Failures are deliberately ignored (check=False) so callers can fall
    back to the unformatted file. The path is shell-quoted because the
    command string is run through the shell.
    """
    subprocess.run(  # nosec
        f"black {shlex.quote(filepath)}",
        stderr=subprocess.STDOUT,
        text=True,
        shell=True,
        timeout=30,
        check=False,
    )
36
+
37
+
38
def format_ruff(filepath: str):
    """Autofix then format a file in place with ruff.

    Both passes ignore failures (check=False); the path is shell-quoted
    because the command strings are run through the shell.
    """
    # First pass: apply ruff's autofixes (unused imports, etc.).
    subprocess.run(  # nosec
        f"ruff check --no-cache --fix {shlex.quote(filepath)}",
        shell=True,
        text=True,
        timeout=30,
        universal_newlines=True,
        check=False,
    )

    # Second pass: ruff's black-compatible formatter.
    subprocess.run(  # nosec
        f"ruff format --no-cache {shlex.quote(filepath)}",
        stderr=subprocess.STDOUT,
        shell=True,
        timeout=30,
        text=True,
        check=False,
    )
57
+
58
+
59
def check_ruff(filepath: str):
    """Lint a file with ruff.

    Raises subprocess.CalledProcessError (with the lint report in
    ``e.output``) when ruff finds problems. The path is shell-quoted
    because the command string is run through the shell.
    """
    subprocess.check_output(  # nosec
        f"ruff check --no-cache {shlex.quote(filepath)}",
        stderr=subprocess.STDOUT,
        shell=True,
        timeout=30,
        text=True,
    )
68
+
69
+
70
def check_mypy(filepath: str, strict: bool = False, follow_imports: str = "skip"):
    """Type-check a file with mypy.

    Args:
        filepath: Path of the file to check (shell-quoted below, since the
            command string is run through the shell).
        strict: Pass ``--strict`` when True.
        follow_imports: Value for mypy's ``--follow-imports`` option.

    Raises:
        subprocess.CalledProcessError: when mypy reports errors (the
            report is available in ``e.output``).
    """
    cmd = (
        f"mypy {'--strict' if strict else ''} "
        f"--follow-imports={follow_imports} {shlex.quote(filepath)}"
    )

    subprocess.check_output(  # nosec
        cmd,
        stderr=subprocess.STDOUT,
        shell=True,
        text=True,
        timeout=30,
    )
81
+
82
+
83
class PythonCode(BaseModel):
    """A Python snippet validated by formatting and static analysis.

    Construction runs the code through black/ruff formatting, then ruff
    and mypy checks; a ValidationError (wrapping ValueError) carries the
    tool complaints back to the agent.
    """

    # The candidate code; the validator below rewrites it to its
    # formatted form.
    code: str = Field(
        description="Python code conforming to ruff, black, and *strict* mypy standards.",
    )

    @validator("code")
    @classmethod
    def check_code(cls, v: str) -> str:
        """Format `v` on disk, lint/type-check it, and return the formatted code.

        Raises ValueError (surfaced by pydantic as a ValidationError)
        containing the code plus ruff/mypy output when checks fail.
        """
        v = strip_python_markdown_tags(v).strip()
        try:
            # delete=False: the file must persist for the subprocess tools
            # below; it is removed explicitly in the finally block.
            # NOTE(review): if NamedTemporaryFile creation itself fails,
            # temp_file_path is unbound in the finally -- confirm acceptable.
            with tempfile.NamedTemporaryFile(mode="w", delete=False) as temp_file:
                temp_file.write(v)
                temp_file_path = temp_file.name

            try:
                # format with black and ruff
                format_black(temp_file_path)
                format_ruff(temp_file_path)
            except subprocess.CalledProcessError:
                pass

            # update `v` with formatted code
            with open(temp_file_path, "r") as temp_file:
                v = temp_file.read()

            # check
            complaints = dict(ruff=None, mypy=None)

            try:
                check_ruff(temp_file_path)
            except subprocess.CalledProcessError as e:
                complaints["ruff"] = e.output

            try:
                check_mypy(temp_file_path)
            except subprocess.CalledProcessError as e:
                complaints["mypy"] = e.output

            # raise ValueError if ruff or mypy had complaints
            if any(complaints.values()):
                code_str = f"```{temp_file_path}\n{v}```"
                error_messages = [
                    f"```{key}\n{value}```"
                    for key, value in complaints.items()
                    if value
                ]
                raise ValueError("\n\n".join([code_str] + error_messages))

        finally:
            os.remove(temp_file_path)
        return v
134
+
135
+
136
def check_code(code: str) -> str:
    """Validate *code* via PythonCode and report the outcome as text.

    On success, returns the formatted code with an LGTM banner; on
    failure, returns the first validation error message (which contains
    the ruff/mypy complaints).
    """
    try:
        validated = PythonCode(code=code)
    except ValidationError as err:
        return err.errors()[0]["msg"]
    return (
        "# LGTM\n# use the `submit` tool to submit this code:\n\n"
        f"```python\n{validated.code}\n```"
    )
142
+
143
+
144
# System prompt steering the coding agent toward lint-/type-clean output
# and toward always running `check` before `submit`.
prompt = ChatPromptTemplate.from_messages(
    [
        (
            "system",
            "You are a world class Python coder who uses black, ruff, and *strict* mypy for all of your code. "
            "Provide complete, end-to-end Python code to meet the user's description/requirements. "
            "Always `check` your code. When you're done, you must ALWAYS use the `submit` tool.",
        ),
        MessagesPlaceholder(variable_name="chat_history"),
        (
            "human",
            "{input}",
        ),
    ],
)

# Tool wrapper around check_code: formats, lints, and type-checks the snippet.
check_code_tool = Tool.from_function(
    check_code,
    name="check-code",
    description="Always check your code before submitting it!",
)

# Terminal tool: strips markdown fences and hands the code straight back
# to the user (return_direct=True ends the agent loop).
submit_code_tool = Tool.from_function(
    lambda s: strip_python_markdown_tags(s),
    name="submit-code",
    description="THIS TOOL is the most important. use it to submit your code to the user who requested it... but be sure to `check` it first!",
    return_direct=True,
)

# Toolset given to the coding agent.
tools = [check_code_tool, submit_code_tool]
174
+
175
+
176
def get_agent(
    llm: BaseLLM,
    agent_type: AgentType = AgentType.CHAT_CONVERSATIONAL_REACT_DESCRIPTION,
):
    """Build the Python-coding agent as a string-in/string-out runnable."""
    conversation_memory = ConversationBufferMemory(
        return_messages=True,
        memory_key="chat_history",
    )
    executor = initialize_agent(
        tools,
        llm,
        agent=agent_type,
        verbose=True,
        handle_parsing_errors=True,
        memory=conversation_memory,
        prompt=prompt,
        return_intermediate_steps=False,
    )
    # Unwrap the executor's output dict to a plain string.
    return executor | (lambda result: result["output"])
langchain-streamlit-demo/qagen.py ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import List
2
+
3
+ from langchain.output_parsers import PydanticOutputParser, OutputFixingParser
4
+ from langchain.prompts.chat import (
5
+ ChatPromptTemplate,
6
+ )
7
+ from langchain.schema.language_model import BaseLanguageModel
8
+ from langchain.schema.retriever import BaseRetriever
9
+ from langchain.schema.runnable import RunnablePassthrough, RunnableSequence
10
+ from pydantic import BaseModel, Field
11
+
12
+
13
class QuestionAnswerPair(BaseModel):
    """A single reading-comprehension question with its answer."""

    question: str = Field(..., description="The question that will be answered.")
    answer: str = Field(..., description="The answer to the question that was asked.")

    def to_str(self, idx: int) -> str:
        """Render as a numbered Markdown entry, aligning the answer under the question."""
        # Indent by the width of "N. " so **A:** lines up under **Q:**.
        indent = " " * (len(str(idx)) + 2)
        return f"{idx}. **Q:** {self.question}\n\n{indent}**A:** {self.answer}"
22
+
23
+
24
class QuestionAnswerPairList(BaseModel):
    """A collection of Q/A pairs generated for one document."""

    QuestionAnswerPairs: List[QuestionAnswerPair]

    def to_str(self) -> str:
        """Render every pair as a 1-based numbered Markdown list."""
        rendered = (
            pair.to_str(number)
            for number, pair in enumerate(self.QuestionAnswerPairs, start=1)
        )
        return "\n\n".join(rendered)
34
+
35
+
36
# Parser that turns the LLM's JSON response into a QuestionAnswerPairList.
PYDANTIC_PARSER: PydanticOutputParser = PydanticOutputParser(
    pydantic_object=QuestionAnswerPairList,
)


# System prompt: instructs the model to emit raw JSON matching the schema
# injected via {format_instructions}.
templ1 = """You are a smart assistant designed to help college professors come up with reading comprehension questions.
Given a piece of text, you must come up with question and answer pairs that can be used to test a student's reading comprehension abilities.
Generate as many question/answer pairs as you can.
When coming up with the question/answer pairs, you must respond in the following format:
{format_instructions}

Do not provide additional commentary and do not wrap your response in Markdown formatting. Return RAW, VALID JSON.
"""
# Human prompt: the user's instructions plus the retrieved document context.
templ2 = """{prompt}
Please create question/answer pairs, in the specified JSON format, for the following text:
----------------
{context}"""
# NOTE(review): .partial() receives the bound method itself (a callable),
# not its result -- LangChain resolves callable partials at format time;
# confirm this is intended rather than get_format_instructions().
CHAT_PROMPT = ChatPromptTemplate.from_messages(
    [
        ("system", templ1),
        ("human", templ2),
    ],
).partial(format_instructions=PYDANTIC_PARSER.get_format_instructions)
59
+
60
+
61
def get_rag_qa_gen_chain(
    retriever: BaseRetriever,
    llm: BaseLanguageModel,
    input_key: str = "prompt",
) -> RunnableSequence:
    """Build a RAG chain that emits Markdown Q/A pairs for a document.

    The retriever supplies {context}; the user's input flows through to
    {prompt}; malformed LLM JSON is repaired by an OutputFixingParser.
    """
    fixing_parser = OutputFixingParser.from_llm(llm=llm, parser=PYDANTIC_PARSER)
    context_step = {"context": retriever, input_key: RunnablePassthrough()}
    return (
        context_step
        | CHAT_PROMPT
        | llm
        | fixing_parser
        | (lambda parsed: parsed.to_str())
    )
langchain-streamlit-demo/research_assistant/__init__.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ from research_assistant.chain import get_chain
2
+
3
+ __all__ = ["get_chain"]
langchain-streamlit-demo/research_assistant/chain.py ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from langchain_core.pydantic_v1 import BaseModel
2
+ from langchain_core.runnables import RunnablePassthrough
3
+
4
+ from research_assistant.search.web import get_search_chain
5
+ from research_assistant.writer import get_writer_chain
6
+ from langchain.llms.base import BaseLLM
7
+ from langchain.schema.runnable import Runnable
8
+
9
+
10
def get_chain(search_llm: BaseLLM, writer_llm: BaseLLM) -> Runnable:
    """Compose the research pipeline: web research, then report writing."""

    class InputType(BaseModel):
        question: str

    # The search chain's output is attached as `research_summary` and fed,
    # together with the original question, to the writer chain.
    research_step = RunnablePassthrough().assign(
        research_summary=get_search_chain(search_llm),
    )
    untyped_chain = research_step | get_writer_chain(writer_llm)

    return untyped_chain.with_types(input_type=InputType)
langchain-streamlit-demo/research_assistant/search/__init__.py ADDED
File without changes
langchain-streamlit-demo/research_assistant/search/web.py ADDED
@@ -0,0 +1,178 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import json
2
+ from typing import Any
3
+
4
+ import requests
5
+ from bs4 import BeautifulSoup
6
+ from langchain.llms.base import BaseLLM
7
+ from langchain.prompts import ChatPromptTemplate
8
+ from langchain.retrievers.tavily_search_api import TavilySearchAPIRetriever
9
+ from langchain.utilities import DuckDuckGoSearchAPIWrapper
10
+ from langchain_core.messages import SystemMessage
11
+ from langchain_core.output_parsers import StrOutputParser
12
+ from langchain_core.runnables import (
13
+ ConfigurableField,
14
+ Runnable,
15
+ RunnableLambda,
16
+ RunnableParallel,
17
+ RunnablePassthrough,
18
+ )
19
+
20
+ RESULTS_PER_QUESTION = 3
21
+
22
+ ddg_search = DuckDuckGoSearchAPIWrapper()
23
+
24
+
25
def scrape_text(url: str, timeout: float = 10.0):
    """Fetch *url* and return its visible text, or an error-message string.

    Args:
        url: Page to download.
        timeout: Seconds to wait for the HTTP response. The original call
            had no timeout, so a single slow host could hang the whole
            research chain indefinitely.

    Returns:
        The page's whitespace-normalized text on success, otherwise a
        human-readable failure description. This function never raises.
    """
    # Send a GET request to the webpage
    try:
        response = requests.get(url, timeout=timeout)

        # Check if the request was successful
        if response.status_code == 200:
            # Parse the content of the request with BeautifulSoup
            soup = BeautifulSoup(response.text, "html.parser")

            # Extract all text from the webpage
            page_text = soup.get_text(separator=" ", strip=True)

            return page_text
        else:
            return f"Failed to retrieve the webpage: Status code {response.status_code}"
    except Exception as e:
        # Best-effort by design: report the failure as text so the chain
        # can keep processing the remaining URLs.
        print(e)
        return f"Failed to retrieve the webpage: {e}"
45
+
46
+
47
def web_search(query: str, num_results: int):
    """Run a DuckDuckGo search and return the result links."""
    hits = ddg_search.results(query, num_results)
    return [hit["link"] for hit in hits]
50
+
51
+
52
# Runnable mapping {"question": ...} to a list of {"url", "question"}
# dicts. The search backend is configurable at invoke time via the
# "search_engine" field: DuckDuckGo by default, Tavily as an alternative.
get_links: Runnable[Any, Any] = (
    RunnablePassthrough()
    | RunnableLambda(
        lambda x: [
            {"url": url, "question": x["question"]}
            for url in web_search(query=x["question"], num_results=RESULTS_PER_QUESTION)
        ],
    )
).configurable_alternatives(
    ConfigurableField("search_engine"),
    default_key="duckduckgo",
    # Tavily path: retrieve documents, then reshape to the same
    # {"url", "question"} records as the default branch.
    tavily=RunnableLambda(lambda x: x["question"])
    | RunnableParallel(
        {
            "question": RunnablePassthrough(),
            "results": TavilySearchAPIRetriever(k=RESULTS_PER_QUESTION),
        },
    )
    | RunnableLambda(
        lambda x: [
            {"url": result.metadata["source"], "question": x["question"]}
            for result in x["results"]
        ],
    ),
)
77
+
78
+
79
# Prompt asking the (role-primed) model for three search queries, returned
# as a JSON list of strings so load_json can parse the response downstream.
SEARCH_PROMPT = ChatPromptTemplate.from_messages(
    [
        ("system", "{agent_prompt}"),
        (
            "user",
            "Write 3 google search queries to search online that form an "
            "objective opinion from the following: {question}\n"
            "You must respond with a list of strings in the following format: "
            '["query 1", "query 2", "query 3"].',
        ),
    ],
)

# Instructions for choosing a specialist "agent" persona for the topic.
# BUGFIX: the few-shot examples previously had mismatched quotes
# ('"agent_role_prompt: "...' and '"agent: "...'), showing the model
# invalid JSON; load_json would then silently swallow the malformed
# response and return {}. The examples below are valid JSON.
AUTO_AGENT_INSTRUCTIONS = """
This task involves researching a given topic, regardless of its complexity or the availability of a definitive answer. The research is conducted by a specific agent, defined by its type and role, with each agent requiring distinct instructions.
Agent
The agent is determined by the field of the topic and the specific name of the agent that could be utilized to research the topic provided. Agents are categorized by their area of expertise, and each agent type is associated with a corresponding emoji.

examples:
task: "should I invest in apple stocks?"
response:
{
    "agent": "💰 Finance Agent",
    "agent_role_prompt": "You are a seasoned finance analyst AI assistant. Your primary goal is to compose comprehensive, astute, impartial, and methodically arranged financial reports based on provided data and trends."
}
task: "could reselling sneakers become profitable?"
response:
{
    "agent": "📈 Business Analyst Agent",
    "agent_role_prompt": "You are an experienced AI business analyst assistant. Your main objective is to produce comprehensive, insightful, impartial, and systematically structured business reports based on provided business data, market trends, and strategic analysis."
}
task: "what are the most interesting sites in Tel Aviv?"
response:
{
    "agent": "🌍 Travel Agent",
    "agent_role_prompt": "You are a world-travelled AI tour guide assistant. Your main purpose is to draft engaging, insightful, unbiased, and well-structured travel reports on given locations, including history, attractions, and cultural insights."
}
"""  # noqa: E501
CHOOSE_AGENT_PROMPT = ChatPromptTemplate.from_messages(
    [SystemMessage(content=AUTO_AGENT_INSTRUCTIONS), ("user", "task: {task}")],
)

# Per-page summarization prompt applied to each scraped page's text.
# BUGFIX: "imply summarize" -> "simply summarize".
SUMMARY_TEMPLATE = """{text}

-----------

Using the above text, answer in short the following question:

> {question}

-----------

If the question cannot be answered using the text, simply summarize the text. Include all factual information, numbers, stats etc if available."""  # noqa: E501
SUMMARY_PROMPT = ChatPromptTemplate.from_template(SUMMARY_TEMPLATE)
132
+
133
+
134
def load_json(s):
    """Parse *s* as JSON, returning {} when it cannot be parsed.

    Used to tolerate malformed LLM output. Only parse-related errors
    (ValueError covers json.JSONDecodeError; TypeError covers non-string
    input such as None) are swallowed -- the original bare
    ``except Exception`` also hid unrelated bugs.
    """
    try:
        return json.loads(s)
    except (ValueError, TypeError):
        return {}
139
+
140
+
141
def get_search_chain(model: BaseLLM) -> Runnable:
    """Build the research chain: pick a persona, generate search queries,
    scrape and summarize each hit, and join everything into one summary.

    Args:
        model: LLM used for persona selection, query generation, and
            per-page summarization.

    Returns:
        A runnable mapping {"question": ...} to a single string of
        per-source summaries.
    """
    # For one {"question", "url"} record: scrape the page (truncated to
    # 10k chars), summarize it w.r.t. the question, and render one line.
    scrape_and_summarize: Runnable[Any, Any] = (
        RunnableParallel(
            {
                "question": lambda x: x["question"],
                "text": lambda x: scrape_text(x["url"])[:10000],
                "url": lambda x: x["url"],
            },
        )
        | RunnableParallel(
            {
                "summary": SUMMARY_PROMPT | model | StrOutputParser(),
                "url": lambda x: x["url"],
            },
        )
        | RunnableLambda(lambda x: f"Source Url: {x['url']}\nSummary: {x['summary']}")
    )

    # Fan out over all links for one question, then join the summaries.
    multi_search = get_links | scrape_and_summarize.map() | (lambda x: "\n".join(x))

    # Both parsers rely on load_json's empty-dict fallback for bad output.
    search_query = SEARCH_PROMPT | model | StrOutputParser() | load_json
    choose_agent = CHOOSE_AGENT_PROMPT | model | StrOutputParser() | load_json

    # First choose a specialist persona, then have that persona write the
    # search queries (a JSON list of strings).
    get_search_queries = (
        RunnablePassthrough().assign(
            agent_prompt=RunnableParallel({"task": lambda x: x})
            | choose_agent
            | (lambda x: x.get("agent_role_prompt")),
        )
        | search_query
    )

    return (
        get_search_queries
        | (lambda x: [{"question": q} for q in x])
        | multi_search.map()
        | (lambda x: "\n\n".join(x))
    )
langchain-streamlit-demo/research_assistant/writer.py ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from langchain.prompts import ChatPromptTemplate
2
+ from langchain_core.output_parsers import StrOutputParser
3
+ from langchain_core.runnables import ConfigurableField
4
+ from langchain.llms.base import BaseLLM
5
+ from langchain.schema.runnable import Runnable
6
+
7
+ WRITER_SYSTEM_PROMPT = "You are an AI critical thinker research assistant. Your sole purpose is to write well written, critically acclaimed, objective and structured reports on given text." # noqa: E501
8
+
9
+
10
+ # Report prompts from https://github.com/assafelovic/gpt-researcher/blob/master/gpt_researcher/master/prompts.py
11
+ RESEARCH_REPORT_TEMPLATE = """Information:
12
+ --------
13
+ {research_summary}
14
+ --------
15
+
16
+ Using the above information, answer the following question or topic: "{question}" in a detailed report -- \
17
+ The report should focus on the answer to the question, should be well structured, informative, \
18
+ in depth, with facts and numbers if available and a minimum of 1,200 words.
19
+
20
+ You should strive to write the report as long as you can using all relevant and necessary information provided.
21
+ You must write the report with markdown syntax.
22
+ You MUST determine your own concrete and valid opinion based on the given information. Do NOT deter to general and meaningless conclusions.
23
+ Write all used source urls at the end of the report, and make sure to not add duplicated sources, but only one reference for each.
24
+ You must write the report in apa format.
25
+ Please do your best, this is very important to my career.""" # noqa: E501
26
+
27
+
28
+ RESOURCE_REPORT_TEMPLATE = """Information:
29
+ --------
30
+ {research_summary}
31
+ --------
32
+
33
+ Based on the above information, generate a bibliography recommendation report for the following question or topic: "{question}". \
34
+ The report should provide a detailed analysis of each recommended resource, explaining how each source can contribute to finding answers to the research question. \
35
+ Focus on the relevance, reliability, and significance of each source. \
36
+ Ensure that the report is well-structured, informative, in-depth, and follows Markdown syntax. \
37
+ Include relevant facts, figures, and numbers whenever available. \
38
+ The report should have a minimum length of 1,200 words.
39
+
40
+ Please do your best, this is very important to my career.""" # noqa: E501
41
+
42
+ OUTLINE_REPORT_TEMPLATE = """Information:
43
+ --------
44
+ {research_summary}
45
+ --------
46
+
47
+ Using the above information, generate an outline for a research report in Markdown syntax for the following question or topic: "{question}". \
48
+ The outline should provide a well-structured framework for the research report, including the main sections, subsections, and key points to be covered. \
49
+ The research report should be detailed, informative, in-depth, and a minimum of 1,200 words. \
50
+ Use appropriate Markdown syntax to format the outline and ensure readability.
51
+
52
+ Please do your best, this is very important to my career.""" # noqa: E501
53
+
54
+ prompt = ChatPromptTemplate.from_messages(
55
+ [
56
+ ("system", WRITER_SYSTEM_PROMPT),
57
+ ("user", RESEARCH_REPORT_TEMPLATE),
58
+ ],
59
+ ).configurable_alternatives(
60
+ ConfigurableField("report_type"),
61
+ default_key="research_report",
62
+ resource_report=ChatPromptTemplate.from_messages(
63
+ [
64
+ ("system", WRITER_SYSTEM_PROMPT),
65
+ ("user", RESOURCE_REPORT_TEMPLATE),
66
+ ],
67
+ ),
68
+ outline_report=ChatPromptTemplate.from_messages(
69
+ [
70
+ ("system", WRITER_SYSTEM_PROMPT),
71
+ ("user", OUTLINE_REPORT_TEMPLATE),
72
+ ],
73
+ ),
74
+ )
75
+
76
+
77
def get_writer_chain(model: BaseLLM) -> Runnable:
    """Build the report-writing chain: configurable prompt -> model -> text."""
    report_pipeline = prompt | model
    return report_pipeline | StrOutputParser()
langchain-streamlit-demo/summarize.py ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from langchain.chains.base import Chain
2
+ from langchain.chains.summarize import load_summarize_chain
3
+ from langchain.prompts import PromptTemplate
4
+ from langchain.schema.language_model import BaseLanguageModel
5
+ from langchain.schema.retriever import BaseRetriever
6
+ from langchain.schema.runnable import RunnableSequence, RunnablePassthrough
7
+
8
# Initial-pass prompt for the "refine" summarization chain: summarizes the
# first document chunk ({text}), steered by the user's request ({query},
# partialled in by get_summarization_chain).
prompt_template = """Write a concise summary of the following text, based on the user input.
User input: {query}
Text:
```
{text}
```
CONCISE SUMMARY:"""
15
+
16
# Refinement prompt for subsequent chunks: the model updates the running
# summary ({existing_answer}) with each new chunk of {text}, keeping the
# user's {query} in focus.
# Fix: the original adjacent literals `"...existing summary"` and
# `"(only if needed)..."` joined with no space, rendering as
# "summary(only if needed)"; a trailing space is added to separate them.
refine_template = (
    "You are iteratively crafting a summary of the text below based on the user input\n"
    "User input: {query}\n"
    "We have provided an existing summary up to a certain point: {existing_answer}\n"
    "We have the opportunity to refine the existing summary "
    "(only if needed) with some more context below.\n"
    "------------\n"
    "{text}\n"
    "------------\n"
    "Given the new context, refine the original summary.\n"
    "If the context isn't useful, return the original summary.\n"
    "If the context is useful, refine the summary to include the new context.\n"
    "Your contribution is helping to build a comprehensive summary of a large body of knowledge.\n"
    "You do not have the complete context, so do not discard pieces of the original summary."
)
31
+
32
+
33
def get_summarization_chain(
    llm: BaseLanguageModel,
    prompt: str,
) -> Chain:
    """Build a refine-style summarization chain steered by a user request.

    Args:
        llm: Language model that performs the summarization.
        prompt: The user's request; baked into both the initial and the
            refinement prompts as the ``query`` template variable.

    Returns:
        A chain that consumes ``input_documents`` and produces ``output_text``.
    """
    initial_prompt = PromptTemplate.from_template(
        prompt_template,
        partial_variables={"query": prompt},
    )
    followup_prompt = PromptTemplate.from_template(
        refine_template,
        partial_variables={"query": prompt},
    )
    return load_summarize_chain(
        llm=llm,
        chain_type="refine",
        question_prompt=initial_prompt,
        refine_prompt=followup_prompt,
        return_intermediate_steps=False,
        input_key="input_documents",
        output_key="output_text",
    )
54
+
55
+
56
def get_rag_summarization_chain(
    prompt: str,
    retriever: BaseRetriever,
    llm: BaseLanguageModel,
    input_key: str = "prompt",
) -> RunnableSequence:
    """Retrieval-augmented summarization: fetch documents, summarize, return text.

    The retriever populates ``input_documents`` while the raw user input is
    passed through unchanged under ``input_key``; the summarization chain's
    dict output is then reduced to its ``output_text`` string.
    """
    gather_inputs = {
        "input_documents": retriever,
        input_key: RunnablePassthrough(),
    }
    summarizer = get_summarization_chain(llm, prompt)

    def _extract_text(result: dict) -> str:
        # load_summarize_chain returns a dict; callers only want the summary.
        return result["output_text"]

    return gather_inputs | summarizer | _extract_text
requirements.txt ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ anthropic==0.12.0
2
+ beautifulsoup4==4.12.3
3
+ black==24.1.1
4
+ certifi>=2023.7.22 # not directly required, pinned by Snyk to avoid a vulnerability
5
+ duckduckgo-search==4.3.2
6
+ faiss-cpu==1.7.4
7
+ langchain==0.1.4
8
+ langsmith==0.0.84
9
+ mypy==1.8.0
10
+ numexpr==2.9.0
11
+ numpy>=1.22.2 # not directly required, pinned by Snyk to avoid a vulnerability
12
+ openai==1.10.0
13
+ pillow>=10.2.0 # not directly required, pinned by Snyk to avoid a vulnerability
14
+ pyarrow>=14.0.1 # not directly required, pinned by Snyk to avoid a vulnerability
15
+ pypdf==4.0.1
16
+ requests>=2.31.0 # not directly required, pinned by Snyk to avoid a vulnerability
17
+ ruff==0.1.14
18
+ streamlit==1.30.0
19
+ streamlit-feedback==0.1.3
20
+ tiktoken==0.5.2
21
+ tornado>=6.3.3 # not directly required, pinned by Snyk to avoid a vulnerability
22
+ validators>=0.21.0 # not directly required, pinned by Snyk to avoid a vulnerability
23
+ wikipedia==1.4.0