Spaces:

MKJ-TOE
/

repository_reader

Running

App Files Community

DeL-TaiseiOzaki committed on Oct 30, 2024

Commit

6a71f13

1 Parent(s): d8c5049

LLMと会話する機能を追加

Browse files

Files changed (9) hide show

app.py +67 -34
config/__pycache__/__init__.cpython-310.pyc +0 -0
config/llm_settings.py +24 -0
core/__pycache__/__init__.cpython-310.pyc +0 -0
core/__pycache__/file_scanner.cpython-310.pyc +0 -0
main.py +0 -69
scan.sh +0 -49
services/__init__.py +0 -0
services/llm_service.py +83 -51

app.py CHANGED Viewed

@@ -1,10 +1,9 @@
 import streamlit as st
 import tempfile
 import git
 from pathlib import Path
 from datetime import datetime
-import time
-from core.file_scanner import FileScanner
 from services.llm_service import LLMService
 # ページ設定
@@ -14,20 +13,34 @@ st.set_page_config(
     layout="wide"
 )
-# カスタムCSS
 st.markdown("""
 <style>
-    .stAlert {
         padding: 1rem;
         margin: 1rem 0;
     }
-    .css-1v0mbdj.ebxwdo61 {
-        width: 100%;
-        max-width: 800px;
     }
 </style>
 """, unsafe_allow_html=True)
 def clone_repository(repo_url: str) -> Path:
     """リポジトリをクローンして一時ディレクトリに保存"""
     temp_dir = Path(tempfile.mkdtemp())
@@ -40,15 +53,24 @@ if 'repo_content' not in st.session_state:
 if 'temp_dir' not in st.session_state:
     st.session_state.temp_dir = None
 if 'llm_service' not in st.session_state:
-    st.session_state.llm_service = None
 # メインのUIレイアウト
 st.title("🔍 リポジトリ解析・質問システム")
-# OpenAI APIキーの設定
-api_key = st.sidebar.text_input("OpenAI APIキー", type="password", key="api_key")
-if api_key:
-    st.session_state.llm_service = LLMService(api_key)
 # URLの入力
 repo_url = st.text_input(
@@ -65,38 +87,50 @@ if st.button("スキャン開始", disabled=not repo_url):
         with st.spinner('ファイルをスキャン中...'):
             scanner = FileScanner(temp_dir)
-            files_content = scanner.scan_files()
-            if st.session_state.llm_service:
-                st.session_state.repo_content = LLMService.format_code_content(files_content)
-        st.success(f"スキャン完了: {len(files_content)}個のファイルを検出")
     except Exception as e:
         st.error(f"エラーが発生しました: {str(e)}")
 # スキャン完了後の質問セクション
-if st.session_state.repo_content and st.session_state.llm_service:
     st.divider()
     st.subheader("💭 コードについて質問する")
     query = st.text_area(
         "質問を入力してください",
         placeholder="例: このコードの主な機能は何ですか？"
     )
-    if st.button("質問する", disabled=not query):
-        with st.spinner('回答を生成中...'):
-            response, error = st.session_state.llm_service.get_response(
-                st.session_state.repo_content,
-                query
-            )
-            if error:
-                st.error(error)
-            else:
-                st.markdown("### 回答:")
-                st.markdown(response)
 # セッション終了時のクリーンアップ
 if st.session_state.temp_dir and Path(st.session_state.temp_dir).exists():
@@ -110,10 +144,9 @@ if st.session_state.temp_dir and Path(st.session_state.temp_dir).exists():
 with st.sidebar:
     st.subheader("📌 使い方")
     st.markdown("""
-    1. OpenAI APIキーを入力
-    2. GitHubリポジトリのURLを入力
-    3. スキャンを実行
-    4. コードについて質問
     """)
     st.subheader("🔍 スキャン対象")

 import streamlit as st
 import tempfile
 import git
+from core.file_scanner import FileScanner
 from pathlib import Path
 from datetime import datetime
 from services.llm_service import LLMService
 # ページ設定
     layout="wide"
 )
+# ダークテーマの設定
 st.markdown("""
 <style>
+    .stApp {
+        background-color: #0e1117;
+        color: #ffffff;
+    }
+    .chat-message {
         padding: 1rem;
         margin: 1rem 0;
+        border-radius: 0.5rem;
     }
+    .assistant-message {
+        background-color: #1e2329;
+        color: #ffffff;
+    }
+    .stButton button {
+        background-color: #2ea44f;
+        color: #ffffff;
+    }
+    .stTextArea textarea {
+        background-color: #1e2329;
+        color: #ffffff;
     }
 </style>
 """, unsafe_allow_html=True)
 def clone_repository(repo_url: str) -> Path:
     """リポジトリをクローンして一時ディレクトリに保存"""
     temp_dir = Path(tempfile.mkdtemp())
 if 'temp_dir' not in st.session_state:
     st.session_state.temp_dir = None
 if 'llm_service' not in st.session_state:
+    try:
+        st.session_state.llm_service = LLMService()
+    except ValueError as e:
+        st.error(str(e))
+        st.stop()
 # メインのUIレイアウト
 st.title("🔍 リポジトリ解析・質問システム")
+# サイドバーでモデル選択
+available_models = st.session_state.llm_service.settings.get_available_models()
+if len(available_models) > 1:
+    selected_model = st.sidebar.selectbox(
+        "使用するモデル",
+        available_models,
+        index=available_models.index(st.session_state.llm_service.current_model)
+    )
+    st.session_state.llm_service.switch_model(selected_model)
 # URLの入力
 repo_url = st.text_input(
         with st.spinner('ファイルをスキャン中...'):
             scanner = FileScanner(temp_dir)
+            files = scanner.scan_files()  # List[FileInfo] を取得
+            st.session_state.repo_content = LLMService.format_code_content(files)
+        st.success(f"スキャン完了: {len(files)}個のファイルを検出")
+        # 新しいスキャン時に会話履歴をクリア
+        st.session_state.llm_service.clear_history()
     except Exception as e:
         st.error(f"エラーが発生しました: {str(e)}")
 # スキャン完了後の質問セクション
+# Question section: shown only once a scan has stored the formatted repository text.
+if st.session_state.repo_content:
     st.divider()
     st.subheader("💭 コードについて質問する")
+    # Show the conversation so far (assistant answers only).
+    for message in st.session_state.llm_service.conversation_history:
+        if message.role == "assistant":
+            # Model output is untrusted text: render it as Markdown inside a chat
+            # bubble rather than interpolating it into raw HTML with
+            # unsafe_allow_html=True, so any tags in the answer are not
+            # interpreted as page markup.
+            with st.chat_message("assistant"):
+                st.markdown(message.content)
     query = st.text_area(
         "質問を入力してください",
         placeholder="例: このコードの主な機能は何ですか？"
     )
+    col1, col2 = st.columns([1, 5])
+    with col1:
+        # Reset the conversation and redraw so the history list empties immediately.
+        if st.button("履歴クリア"):
+            st.session_state.llm_service.clear_history()
+            st.rerun()
+    with col2:
+        if st.button("質問する", disabled=not query):
+            with st.spinner('回答を生成中...'):
+                # The answer itself is read back from conversation_history after
+                # the rerun, so only the error half of the result is used here.
+                _answer, error = st.session_state.llm_service.get_response(
+                    st.session_state.repo_content,
+                    query
+                )
+                if error:
+                    st.error(error)
+                else:
+                    st.rerun()  # redraw so the new answer appears in the history
 # セッション終了時のクリーンアップ
 if st.session_state.temp_dir and Path(st.session_state.temp_dir).exists():
 with st.sidebar:
     st.subheader("📌 使い方")
     st.markdown("""
+    1. GitHubリポジトリのURLを入力
+    2. スキャンを実行
+    3. コードについて質問（最大5ターンの会話が可能）
     """)
     st.subheader("🔍 スキャン対象")

config/__pycache__/__init__.cpython-310.pyc CHANGED Viewed

Binary files a/config/__pycache__/__init__.cpython-310.pyc and b/config/__pycache__/__init__.cpython-310.pyc differ

config/llm_settings.py ADDED Viewed

	@@ -0,0 +1,24 @@

+import os
+from dotenv import load_dotenv
+from typing import Literal
+class LLMSettings:
+    """Provider API keys and the default model name, read from the environment."""
+    def __init__(self):
+        """Load ``.env`` and read OPENAI_API_KEY, ANTHROPIC_API_KEY and DEFAULT_LLM.
+
+        Raises:
+            ValueError: if neither API key is set.
+        """
+        load_dotenv()
+        env = os.environ
+        self.openai_api_key = env.get('OPENAI_API_KEY')
+        self.anthropic_api_key = env.get('ANTHROPIC_API_KEY')
+        self.default_llm = env.get('DEFAULT_LLM', 'claude')
+        # At least one provider key must be present.
+        if not (self.openai_api_key or self.anthropic_api_key):
+            raise ValueError("少なくとも1つのAPIキーが必要です。")
+    def get_available_models(self) -> list[Literal['claude', 'gpt']]:
+        """Return the model names whose API key is set, 'claude' before 'gpt'."""
+        keyed_models = (
+            ('claude', self.anthropic_api_key),
+            ('gpt', self.openai_api_key),
+        )
+        return [name for name, key in keyed_models if key]

core/__pycache__/__init__.cpython-310.pyc CHANGED Viewed

Binary files a/core/__pycache__/__init__.cpython-310.pyc and b/core/__pycache__/__init__.cpython-310.pyc differ

core/__pycache__/file_scanner.cpython-310.pyc CHANGED Viewed

Binary files a/core/__pycache__/file_scanner.cpython-310.pyc and b/core/__pycache__/file_scanner.cpython-310.pyc differ

main.py DELETED Viewed

@@ -1,69 +0,0 @@
-import sys
-from pathlib import Path
-from config.settings import Settings
-from core.git_manager import GitManager
-from core.file_scanner import FileScanner
-from utils.file_writer import FileWriter
-def main():
-    # コマンドライン引数からパスを取得
-    if len(sys.argv) != 2:
-        print("Usage: python main.py <github_url or directory_path>")
-        return 1
-    target_path = sys.argv[1]
-    timestamp = Settings.get_timestamp()
-    output_file = Settings.get_output_file(timestamp)
-    # GitHubのURLかローカルパスかを判定
-    is_github = target_path.startswith(('http://', 'https://')) and 'github.com' in target_path
-    try:
-        if is_github:
-            # GitHubリポジトリの場合
-            clone_dir = Settings.get_clone_dir(timestamp)
-            print(f"Cloning repository: {target_path}")
-            git_manager = GitManager(target_path, clone_dir)
-            git_manager.clone_repository()
-            scanner = FileScanner(clone_dir)
-            cleanup_needed = True
-        else:
-            # ローカルディレクトリの場合
-            target_dir = Path(target_path)
-            if not target_dir.exists():
-                print(f"Error: Directory not found: {target_dir}")
-                return 1
-            scanner = FileScanner(target_dir)
-            cleanup_needed = False
-        # ファイルスキャンと保存
-        print("Scanning files...")
-        files = scanner.scan_files()
-        print(f"Writing contents to {output_file}")
-        writer = FileWriter(output_file)
-        writer.write_contents(files)
-        print(f"Found {len(files)} files")
-        print(f"Results saved to {output_file}")
-    except Exception as e:
-        print(f"Error: {e}")
-        return 1
-    finally:
-        # GitHubリポジトリの場合はクリーンアップ
-        if is_github and cleanup_needed and 'git_manager' in locals():
-            try:
-                git_manager.cleanup()
-                print("Cleanup completed")
-            except Exception as e:
-                print(f"Cleanup error: {e}")
-    return 0
-if __name__ == "__main__":
-    exit(main())

scan.sh DELETED Viewed

@@ -1,49 +0,0 @@
-#!/bin/bash
-# エラーが発生した場合に停止
-set -e
-# デフォルトのターゲットパスを設定
-# ここを変更することで対象を変更できます
-TARGET_PATH="https://github.com/DeL-TaiseiOzaki/idebate_scraping.git"  # 例: Linuxカーネル
-# TARGET_PATH="/path/to/your/directory"  # ローカルディレクトリの例
-# 必要なディレクトリの存在確認
-if [ ! -d "output" ]; then
-    mkdir output
-fi
-# Pythonの存在確認
-if ! command -v python3 &> /dev/null; then
-    echo "Error: Python3 is not installed"
-    exit 1
-fi
-# GitHubリポジトリの場合、Gitの存在確認
-if [[ $TARGET_PATH == http* ]] && [[ $TARGET_PATH == *github.com* ]]; then
-    if ! command -v git &> /dev/null; then
-        echo "Error: Git is not installed"
-        exit 1
-    fi
-    echo "Scanning GitHub repository: $TARGET_PATH"
-else
-    if [ ! -d "$TARGET_PATH" ]; then
-        echo "Error: Directory not found: $TARGET_PATH"
-        exit 1
-    fi
-    echo "Scanning local directory: $TARGET_PATH"
-fi
-# スキャンの実行
-echo "Starting directory scan..."
-python3 main.py "$TARGET_PATH"
-exit_code=$?
-if [ $exit_code -eq 0 ]; then
-    echo "Scan completed successfully!"
-    echo "Results are saved in the 'output' directory"
-else
-    echo "Scan failed with exit code: $exit_code"
-    exit $exit_code
-fi

services/__init__.py ADDED Viewed

File without changes

services/llm_service.py CHANGED Viewed

@@ -1,26 +1,39 @@
-from typing import Optional
 import openai
-from pathlib import Path
 class LLMService:
-    def __init__(self, api_key: str):
-        """
-        LLMサービスの初期化
-        Args:
-            api_key: OpenAI APIキー
-        """
-        self.api_key = api_key
-        openai.api_key = api_key
     def create_prompt(self, content: str, query: str) -> str:
-        """
-        プロンプトを生成
-        Args:
-            content: コードの内容
-            query: ユーザーからの質問
-        Returns:
-            生成されたプロンプト
-        """
         return f"""以下はGitHubリポジトリのコード解析結果です。このコードについて質問に答えてください。
 コード解析結果:
@@ -30,49 +43,68 @@ class LLMService:
 できるだけ具体的に、コードの内容を参照しながら回答してください。"""
-    def get_response(self, content: str, query: str) -> tuple[str, Optional[str]]:
-        """
-        LLMを使用して回答を生成
-        Args:
-            content: コードの内容
-            query: ユーザーからの質問
-        Returns:
-            (回答, エラーメッセージ)のタプル
-        """
         try:
             prompt = self.create_prompt(content, query)
-            response = openai.ChatCompletion.create(
-                model="gpt-3.5-turbo-16k",
-                messages=[
-                    {
-                        "role": "system",
-                        "content": "あなたはコードアナリストとして、リポジトリの解析と質問への回答を行います。"
-                    },
-                    {
-                        "role": "user",
-                        "content": prompt
-                    }
-                ]
-            )
-            return response.choices[0].message.content, None
         except Exception as e:
             return None, f"エラーが発生しました: {str(e)}"
     @staticmethod
-    def format_code_content(files_content: dict) -> str:
-        """
-        ファイル内容をプロンプト用にフォーマット
-        Args:
-            files_content: ファイルパスと内容の辞書
-        Returns:
-            フォーマットされたテキスト
-        """
         formatted_content = []
-        for file_path, content in files_content.items():
             formatted_content.append(
-                f"#ファイルパス\n{file_path}\n------------\n{content}\n"
             )
         return "\n".join(formatted_content)

+from typing import Optional, List, Dict, Any
 import openai
+import anthropic
+from dataclasses import dataclass
+from config.llm_settings import LLMSettings
+from core.file_scanner import FileInfo
+@dataclass
+class Message:
+    """One entry in the conversation history kept by LLMService."""
+    # Speaker of the message; this file stores "user" and "assistant".
+    role: str
+    # Message text: the generated prompt for user entries, the model's answer
+    # for assistant entries.
+    content: str
 class LLMService:
+    MAX_TURNS = 5
+    def __init__(self):
+        """Load settings, choose the active model and set up the API clients.
+
+        Raises:
+            ValueError: propagated from LLMSettings when no API key is configured.
+        """
+        self.settings = LLMSettings()
+        available = self.settings.get_available_models()
+        preferred = self.settings.default_llm
+        # DEFAULT_LLM (default 'claude') may name a backend whose key is missing;
+        # fall back to a backend that is actually usable so the first request
+        # does not fail on a client that was never created.
+        if preferred in available or not available:
+            self.current_model = preferred
+        else:
+            self.current_model = available[0]
+        # Always define the attribute so it exists even without an Anthropic key.
+        self.claude_client = None
+        if self.settings.anthropic_api_key:
+            self.claude_client = anthropic.Anthropic(api_key=self.settings.anthropic_api_key)
+        if self.settings.openai_api_key:
+            openai.api_key = self.settings.openai_api_key
+        self.conversation_history: List[Message] = []
+    def switch_model(self, model: str):
+        """Make ``model`` the active backend.
+
+        Raises:
+            ValueError: if ``model`` is not among the settings' available models.
+        """
+        allowed = self.settings.get_available_models()
+        if model in allowed:
+            self.current_model = model
+            return
+        raise ValueError(f"モデル {model} は利用できません")
     def create_prompt(self, content: str, query: str) -> str:
+        """プロンプトを生成"""
         return f"""以下はGitHubリポジトリのコード解析結果です。このコードについて質問に答えてください。
 コード解析結果:
 できるだけ具体的に、コードの内容を参照しながら回答してください。"""
+    def _add_to_history(self, role: str, content: str):
+        """Append a message and keep at most MAX_TURNS question/answer pairs.
+
+        Args:
+            role: speaker of the message ("user" or "assistant" in this file).
+            content: message text.
+        """
+        self.conversation_history.append(Message(role=role, content=content))
+        limit = self.MAX_TURNS * 2  # each turn is a question plus an answer
+        if len(self.conversation_history) > limit:
+            window = self.conversation_history[-limit:]
+            # Trimming happens right after a user message is appended, so the
+            # plain tail slice starts with an assistant message. Drop leading
+            # non-user messages so the history sent to the model always opens
+            # with a user turn.
+            first_user = next(
+                (i for i, msg in enumerate(window) if msg.role == "user"),
+                len(window),
+            )
+            self.conversation_history = window[first_user:]
+    def _format_messages_for_claude(self) -> List[Dict[str, str]]:
+        """Return the history as role/content dicts for the Claude messages call."""
+        payload = []
+        for entry in self.conversation_history:
+            payload.append({"role": entry.role, "content": entry.content})
+        return payload
+    def _format_messages_for_gpt(self) -> List[Dict[str, str]]:
+        """Return the fixed system message followed by the history as role/content dicts."""
+        system_message = {
+            "role": "system",
+            "content": "あなたはコードアナリストとして、リポジトリの解析と質問への回答を行います。",
+        }
+        messages = [system_message]
+        messages.extend(
+            {"role": entry.role, "content": entry.content}
+            for entry in self.conversation_history
+        )
+        return messages
+    def get_conversation_history(self) -> List[Dict[str, str]]:
+        """Return the stored messages as a new list of plain role/content dicts."""
+        return [
+            dict(role=entry.role, content=entry.content)
+            for entry in self.conversation_history
+        ]
+    def clear_history(self):
+        """Discard all stored messages by rebinding the history to a new empty list."""
+        self.conversation_history = list()
+    def get_response(self, content: str, query: str) -> tuple[Optional[str], Optional[str]]:
+        """Ask the active model a question about the repository content.
+
+        Args:
+            content: formatted repository text placed into the prompt.
+            query: the user's question.
+
+        Returns:
+            ``(answer, None)`` on success, ``(None, error_message)`` on failure.
+            No exception is raised to the caller; any error is reported through
+            the second element.
+        """
+        # Snapshot the history so a failed request can be rolled back. Otherwise
+        # the user prompt appended below would stay behind without an answer
+        # and the next attempt would send two consecutive user turns.
+        snapshot = list(self.conversation_history)
         try:
             prompt = self.create_prompt(content, query)
+            self._add_to_history("user", prompt)
+            if self.current_model == 'claude':
+                response = self.claude_client.messages.create(
+                    model="claude-3-sonnet-20240229",
+                    max_tokens=4000,
+                    messages=self._format_messages_for_claude()
+                )
+                answer = response.content[0].text
+            else:  # gpt
+                # NOTE(review): openai.ChatCompletion is the pre-1.0 client
+                # interface; confirm the pinned openai version still provides it.
+                response = openai.ChatCompletion.create(
+                    model="gpt-3.5-turbo-16k",
+                    messages=self._format_messages_for_gpt()
+                )
+                answer = response.choices[0].message.content
+            self._add_to_history("assistant", answer)
+            return answer, None
         except Exception as e:
+            # Top-level boundary for the UI: undo the partial history update
+            # and report the failure as text instead of raising.
+            self.conversation_history = snapshot
             return None, f"エラーが発生しました: {str(e)}"
     @staticmethod
+    def format_code_content(files: List[FileInfo]) -> str:
+        """Join the scanned files into one prompt text, one path/content section per file."""
+        sections = [
+            f"#ファイルパス\n{file_info.path}\n------------\n{file_info.content}\n"
+            for file_info in files
+        ]
+        return "\n".join(sections)