Spaces:

MKJ-TOE
/

repository_reader

Running

App Files Files Community

DeL-TaiseiOzaki committed on Oct 30, 2024

Commit

227e75d

1 Parent(s): 0b1e3e4

first commit

Browse files

Files changed (24) hide show

README copy.md +96 -0
app.py +130 -0
config/__init__.py +0 -0
config/__pycache__/__init__.cpython-310.pyc +0 -0
config/__pycache__/setting.cpython-310.pyc +0 -0
config/__pycache__/settings.cpython-310.pyc +0 -0
config/settings.py +18 -0
core/__init__.py +0 -0
core/__pycache__/__init__.cpython-310.pyc +0 -0
core/__pycache__/file_scanner.cpython-310.pyc +0 -0
core/__pycache__/git_manager.cpython-310.pyc +0 -0
core/file_scanner.py +60 -0
core/git_manager.py +34 -0
main.py +69 -0
output/scan_result_20241030_210745.txt +242 -0
rquirements.txt +4 -0
scan.sh +49 -0
services/llm_service.py +78 -0
utils/__init__.py +0 -0
utils/__pycache__/__init__.cpython-310.pyc +0 -0
utils/__pycache__/content_exporter.cpython-310.pyc +0 -0
utils/__pycache__/file_writer.cpython-310.pyc +0 -0
utils/file_writer.py +24 -0
utils/logger.py +26 -0

README copy.md ADDED Viewed

	@@ -0,0 +1,96 @@

+# get_repository_info_by_llm
+プログラミング関連ファイルを再帰的にスキャンし、内容を単一のテキストファイルにエクスポートするツールです。GitHubリポジトリまたはローカルディレクトリに対応しています。
+## 機能
+- GitHubリポジトリのクローンとスキャン
+- ローカルディレクトリのスキャン
+- 再帰的なファイル検索
+- 主要なプログラミング言語ファイルの検出
+- UTF-8/CP932エンコーディングの自動検出
+- 結果のテキストファイル出力
+## 必要条件
+- Python 3.7以上
+- Git（GitHubリポジトリをスキャンする場合）
+## インストール
+1. リポジトリをクローン
+```bash
+git clone [このリポジトリのURL]
+cd directory-scanner
+```
+2. 必要なディレクトリを作成
+```bash
+mkdir output
+```
+## 使用方法
+### コマンドライン
+```bash
+# GitHubリポジトリをスキャン
+python main.py https://github.com/username/repository.git
+# ローカルディレクトリをスキャン
+python main.py /path/to/directory
+```
+### シェルスクリプトを使用
+```bash
+# スクリプトに実行権限を付与
+chmod +x scan.sh
+# GitHubリポジトリをスキャン
+./scan.sh https://github.com/username/repository.git
+# ローカルディレクトリをスキャン
+./scan.sh /path/to/directory
+```
+## 出力形式
+スキャン結果は `output` ディレクトリに保存され、以下の形式で出力されます：
+```
+#ファイルパス
+path/to/file.py
+------------
+ファイルの内容
+```
+## スキャン対象
+### 対象となるファイル拡張子
+- Python (.py)
+- JavaScript (.js)
+- Java (.java)
+- C/C++ (.c, .h, .cpp, .hpp)
+- Go (.go)
+- Rust (.rs)
+- PHP (.php)
+- Ruby (.rb)
+- TypeScript (.ts)
+- その他 (.scala, .kt, .cs, .swift, .m, .sh, .pl, .r)
+### 除外されるディレクトリ
+- .git
+- __pycache__
+- node_modules
+- venv
+- .env
+- build
+- dist
+- target
+- bin
+- obj
+## 注意事項
+- GitHubリポジトリをスキャンする場合、一時的にローカルにクローンされます
+- スキャン完了後、クローンされたリポジトリは自動的に削除されます
+- 大きなファイルや特殊なエンコーディングのファイルは読み取れない場合があります

app.py ADDED Viewed

	@@ -0,0 +1,130 @@

+import streamlit as st
+import tempfile
+import git
+from pathlib import Path
+from datetime import datetime
+import time
+from dotenv import load_dotenv
+from core.file_scanner import FileScanner
+from services.llm_service import LLMService
+# 環境変数の読み込み
+load_dotenv()
+# ページ設定
+st.set_page_config(
+    page_title="Repository Code Analysis",
+    page_icon="🔍",
+    layout="wide"
+)
+# カスタムCSS
+st.markdown("""
+<style>
+    .stAlert {
+        padding: 1rem;
+        margin: 1rem 0;
+    }
+    .css-1v0mbdj.ebxwdo61 {
+        width: 100%;
+        max-width: 800px;
+    }
+</style>
+""", unsafe_allow_html=True)
+def clone_repository(repo_url: str) -> Path:
+    """リポジトリをクローンして一時ディレクトリに保存"""
+    temp_dir = Path(tempfile.mkdtemp())
+    git.Repo.clone_from(repo_url, temp_dir)
+    return temp_dir
+# セッション状態の初期化
+if 'repo_content' not in st.session_state:
+    st.session_state.repo_content = None
+if 'temp_dir' not in st.session_state:
+    st.session_state.temp_dir = None
+if 'llm_service' not in st.session_state:
+    st.session_state.llm_service = None
+# メインのUIレイアウト
+st.title("🔍 リポジトリ解析・質問システム")
+# OpenAI APIキーの設定
+api_key = st.sidebar.text_input("OpenAI APIキー", type="password", key="api_key")
+if api_key:
+    st.session_state.llm_service = LLMService(api_key)
+# URLの入力
+repo_url = st.text_input(
+    "GitHubリポジトリのURLを入力",
+    placeholder="https://github.com/username/repository.git"
+)
+# スキャン実行ボタン
+if st.button("スキャン開始", disabled=not repo_url):
+    try:
+        with st.spinner('リポジトリをクローン中...'):
+            temp_dir = clone_repository(repo_url)
+            st.session_state.temp_dir = temp_dir
+        with st.spinner('ファイルをスキャン中...'):
+            scanner = FileScanner(temp_dir)
+            files_content = scanner.scan_files()
+            if st.session_state.llm_service:
+                st.session_state.repo_content = LLMService.format_code_content(files_content)
+        st.success(f"スキャン完了: {len(files_content)}個のファイルを検出")
+    except Exception as e:
+        st.error(f"エラーが発生しました: {str(e)}")
+# スキャン完了後の質問セクション
+if st.session_state.repo_content and st.session_state.llm_service:
+    st.divider()
+    st.subheader("💭 コードについて質問する")
+    query = st.text_area(
+        "質問を入力してください",
+        placeholder="例: このコードの主な機能は何ですか？"
+    )
+    if st.button("質問する", disabled=not query):
+        with st.spinner('回答を生成中...'):
+            response, error = st.session_state.llm_service.get_response(
+                st.session_state.repo_content,
+                query
+            )
+            if error:
+                st.error(error)
+            else:
+                st.markdown("### 回答:")
+                st.markdown(response)
+# セッション終了時のクリーンアップ
+if st.session_state.temp_dir and Path(st.session_state.temp_dir).exists():
+    try:
+        import shutil
+        shutil.rmtree(st.session_state.temp_dir)
+    except:
+        pass
+# サイドバー情報
+with st.sidebar:
+    st.subheader("📌 使い方")
+    st.markdown("""
+    1. OpenAI APIキーを入力
+    2. GitHubリポジトリのURLを入力
+    3. スキャンを実行
+    4. コードについて質問
+    """)
+    st.subheader("🔍 スキャン対象")
+    st.markdown("""
+    - Python (.py)
+    - JavaScript (.js)
+    - Java (.java)
+    - C/C++ (.c, .h, .cpp, .hpp)
+    - その他の主要なプログラミング言語
+    """)

config/__init__.py ADDED Viewed

File without changes

config/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (153 Bytes). View file

config/__pycache__/setting.cpython-310.pyc ADDED Viewed

Binary file (1.02 kB). View file

config/__pycache__/settings.cpython-310.pyc ADDED Viewed

Binary file (1.03 kB). View file

config/settings.py ADDED Viewed

	@@ -0,0 +1,18 @@

+from pathlib import Path
+from datetime import datetime
+class Settings:
+    DEFAULT_OUTPUT_DIR = Path("output")
+    TIMESTAMP_FORMAT = "%Y%m%d_%H%M%S"
+    @classmethod
+    def get_timestamp(cls) -> str:
+        return datetime.now().strftime(cls.TIMESTAMP_FORMAT)
+    @classmethod
+    def get_clone_dir(cls, timestamp: str) -> Path:
+        return cls.DEFAULT_OUTPUT_DIR / f"repo_clone_{timestamp}"
+    @classmethod
+    def get_output_file(cls, timestamp: str) -> Path:
+        return cls.DEFAULT_OUTPUT_DIR / f"scan_result_{timestamp}.txt"

core/__init__.py ADDED Viewed

File without changes

core/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (151 Bytes). View file

core/__pycache__/file_scanner.cpython-310.pyc ADDED Viewed

Binary file (2.55 kB). View file

core/__pycache__/git_manager.cpython-310.pyc ADDED Viewed

Binary file (1.3 kB). View file

core/file_scanner.py ADDED Viewed

	@@ -0,0 +1,60 @@

+from pathlib import Path
+from typing import List, Dict, Optional
+from dataclasses import dataclass
+@dataclass
+class FileInfo:
+    path: Path
+    content: Optional[str] = None
+class FileScanner:
+    # スキャン対象の拡張子
+    TARGET_EXTENSIONS = {
+        '.py', '.js', '.java', '.cpp', '.hpp', '.c', '.h',
+        '.go', '.rs', '.php', '.rb', '.ts', '.scala', '.kt',
+        '.cs', '.swift', '.m', '.sh', '.pl', '.r'
+    }
+    # スキャン対象から除外するディレクトリ
+    EXCLUDED_DIRS = {
+        '.git', '__pycache__', 'node_modules', 'venv', '.env',
+        'build', 'dist', 'target', 'bin', 'obj'
+    }
+    def __init__(self, base_dir: Path):
+        self.base_dir = base_dir
+    def _should_scan_file(self, path: Path) -> bool:
+        if any(excluded in path.parts for excluded in self.EXCLUDED_DIRS):
+            return False
+        return path.suffix.lower() in self.TARGET_EXTENSIONS
+    def _read_file_content(self, file_path: Path) -> Optional[str]:
+        try:
+            # まずUTF-8で試す
+            try:
+                with file_path.open('r', encoding='utf-8') as f:
+                    return f.read()
+            except UnicodeDecodeError:
+                # UTF-8で失敗したらcp932を試す
+                with file_path.open('r', encoding='cp932') as f:
+                    return f.read()
+        except (OSError, UnicodeDecodeError):
+            return None
+    def scan_files(self) -> List[FileInfo]:
+        if not self.base_dir.exists():
+            raise FileNotFoundError(f"Directory not found: {self.base_dir}")
+        files = []
+        for entry in self.base_dir.rglob('*'):
+            if entry.is_file() and self._should_scan_file(entry):
+                content = self._read_file_content(entry)
+                if content is not None:
+                    files.append(FileInfo(
+                        path=entry.relative_to(self.base_dir),
+                        content=content
+                    ))
+        return sorted(files, key=lambda x: str(x.path))

core/git_manager.py ADDED Viewed

	@@ -0,0 +1,34 @@

+import subprocess
+from pathlib import Path
+class GitManager:
+    def __init__(self, repo_url: str, target_dir: Path):
+        self.repo_url = repo_url
+        self.target_dir = target_dir
+    def clone_repository(self) -> bool:
+        try:
+            if self.target_dir.exists():
+                raise FileExistsError(f"Directory already exists: {self.target_dir}")
+            self.target_dir.parent.mkdir(parents=True, exist_ok=True)
+            subprocess.run(
+                ["git", "clone", self.repo_url, str(self.target_dir)],
+                check=True,
+                capture_output=True,
+                text=True
+            )
+            return True
+        except subprocess.CalledProcessError as e:
+            raise RuntimeError(f"Clone error: {e.stderr}")
+    def cleanup(self):
+        if self.target_dir.exists():
+            subprocess.run(
+                ["rm", "-rf", str(self.target_dir)],
+                check=True,
+                capture_output=True,
+                text=True
+            )

main.py ADDED Viewed

	@@ -0,0 +1,69 @@

+import sys
+from pathlib import Path
+from config.settings import Settings
+from core.git_manager import GitManager
+from core.file_scanner import FileScanner
+from utils.file_writer import FileWriter
+def main():
+    # コマンドライン引数からパスを取得
+    if len(sys.argv) != 2:
+        print("Usage: python main.py <github_url or directory_path>")
+        return 1
+    target_path = sys.argv[1]
+    timestamp = Settings.get_timestamp()
+    output_file = Settings.get_output_file(timestamp)
+    # GitHubのURLかローカルパスかを判定
+    is_github = target_path.startswith(('http://', 'https://')) and 'github.com' in target_path
+    try:
+        if is_github:
+            # GitHubリポジトリの場合
+            clone_dir = Settings.get_clone_dir(timestamp)
+            print(f"Cloning repository: {target_path}")
+            git_manager = GitManager(target_path, clone_dir)
+            git_manager.clone_repository()
+            scanner = FileScanner(clone_dir)
+            cleanup_needed = True
+        else:
+            # ローカルディレクトリの場合
+            target_dir = Path(target_path)
+            if not target_dir.exists():
+                print(f"Error: Directory not found: {target_dir}")
+                return 1
+            scanner = FileScanner(target_dir)
+            cleanup_needed = False
+        # ファイルスキャンと保存
+        print("Scanning files...")
+        files = scanner.scan_files()
+        print(f"Writing contents to {output_file}")
+        writer = FileWriter(output_file)
+        writer.write_contents(files)
+        print(f"Found {len(files)} files")
+        print(f"Results saved to {output_file}")
+    except Exception as e:
+        print(f"Error: {e}")
+        return 1
+    finally:
+        # GitHubリポジトリの場合はクリーンアップ
+        if is_github and cleanup_needed and 'git_manager' in locals():
+            try:
+                git_manager.cleanup()
+                print("Cleanup completed")
+            except Exception as e:
+                print(f"Cleanup error: {e}")
+    return 0
+if __name__ == "__main__":
+    exit(main())

output/scan_result_20241030_210745.txt ADDED Viewed

	@@ -0,0 +1,242 @@

+#ファイルパス
+Get_URL_list/get_url_list.py
+------------
+import json
+import requests
+from bs4 import BeautifulSoup
+# Load URLs from JSON file
+with open('ideabte_scraping/Get_URL_list/URL_json_output/debate_urls.json', 'r') as f:
+    json_urls = json.load(f)
+# Function to get sub-page URLs from a main theme URL
+def get_debate_topic_urls(main_url):
+    response = requests.get(main_url)
+    soup = BeautifulSoup(response.text, 'html.parser')
+    # Extract all links from the main URL page
+    links = soup.find_all('a', href=True)
+    # Filter for links that are debate topics
+    topic_urls = [link['href'] for link in links if link['href'].startswith('/')]
+    # Make URLs absolute
+    full_urls = [f"https://idebate.net{url}" for url in topic_urls if "~b" in url]
+    return full_urls
+# Dictionary to store all debate topic URLs for each main theme URL
+all_debate_topic_urls = {}
+for theme_url in json_urls:
+    theme_name = theme_url.split("/")[-2].replace("~", "_")
+    all_debate_topic_urls[theme_name] = get_debate_topic_urls(theme_url)
+# Output the results
+with open('ideabte_scraping/Get_URL_list/output/debate_topic_urls.json', 'w') as f:
+    json.dump(all_debate_topic_urls, f, indent=4)
+print("Debate topic URLs have been saved to debate_topic_urls.json")
+#ファイルパス
+scraping_idebate/run_main.sh
+------------
+#!/bin/bash
+# Set default paths
+JSON_FILE="ideabte_scraping/Get_URL_list/output/debate_topic_urls.json"
+OUTPUT_DIR="ideabte_scraping/scraping_idebate/output"
+# Check if the JSON file exists
+if [ ! -f "$JSON_FILE" ]; then
+    echo "Error: JSON file '$JSON_FILE' does not exist."
+    exit 1
+fi
+# Create the output directory if it doesn't exist
+mkdir -p "$OUTPUT_DIR"
+# Run the Python script
+python3 ideabte_scraping/scraping_idebate/src/scraping.py "$JSON_FILE" "$OUTPUT_DIR"
+echo "Scraping completed. Output files are stored in $OUTPUT_DIR"
+#ファイルパス
+scraping_idebate/src/scraping.py
+------------
+import requests
+from bs4 import BeautifulSoup
+import json
+import os
+import sys
+from urllib.parse import urlparse
+def scrape_url(url, output_dir):
+    response = requests.get(url)
+    response.raise_for_status()
+    soup = BeautifulSoup(response.content, 'html.parser')
+    topic = soup.find("h1", class_="blog-post__title").get_text(strip=True)
+    points_list = []
+    def extract_points(section, section_name):
+        accordion_items = section.find_next_sibling('div', class_='accordion').find_all('div', class_='accordion__item')
+        for item in accordion_items:
+            point_subtitle = item.find('h4', class_='accordion__subtitle').get_text().strip()
+            point_body = item.find('div', class_='accordion__body').find('p').get_text().strip()
+            points_list.append({
+                "topic": topic,
+                "section": section_name,
+                "context": f"**{point_subtitle}**\n{point_body}"
+            })
+    points_for_section = soup.find('div', class_='points-vote points-vote--for')
+    if points_for_section:
+        extract_points(points_for_section, "Points For")
+    points_against_section = soup.find('div', class_='points-vote points-vote--against')
+    if points_against_section:
+        extract_points(points_against_section, "Points Against")
+    # Generate a unique filename based on the URL
+    parsed_url = urlparse(url)
+    filename = f"{parsed_url.path.strip('/').replace('/', '_')}.json"
+    output_path = os.path.join(output_dir, filename)
+    with open(output_path, "w", encoding="utf-8") as f:
+        json.dump(points_list, f, ensure_ascii=False, indent=4)
+    print(f"Data saved to {output_path}")
+if __name__ == "__main__":
+    if len(sys.argv) != 3:
+        print("Usage: python script.py <json_file> <output_dir>")
+        sys.exit(1)
+    json_file = sys.argv[1]
+    output_dir = sys.argv[2]
+    os.makedirs(output_dir, exist_ok=True)
+    with open(json_file, 'r') as f:
+        url_data = json.load(f)
+    for category, urls in url_data.items():
+        for url in urls:
+            try:
+                scrape_url(url, output_dir)
+            except Exception as e:
+                print(f"Error scraping {url}: {str(e)}")
+#ファイルパス
+scraping_idebate/src/scraping_test.py
+------------
+import requests
+from bs4 import BeautifulSoup
+url = "https://idebate.net/this-house-would-make-all-museums-free-of-charge~b641/"
+# ウェブページを取得
+response = requests.get(url)
+response.raise_for_status()  # エラーチェック
+# HTMLを解析
+soup = BeautifulSoup(response.content, 'html.parser')
+# Points Forのdiv要素を取得
+points_for_section = soup.find('div', class_='points-vote points-vote--for')
+# ポイントを含むアコーディオン要素を取得
+accordion_items = points_for_section.find_next_sibling('div', class_='accordion').find_all('div', class_='accordion__item')
+# 各ポイントのテキストを抽出
+points = []
+for item in accordion_items:
+    point_subtitle = item.find('h4', class_='accordion__subtitle').get_text().strip()
+    point_body = item.find('div', class_='accordion__body').find('p').get_text().strip()
+    points.append(f"**{point_subtitle}**\n{point_body}")
+# 抽出したポイントを出力
+for point in points:
+    print(point)
+    print("-" * 20)  # 区切り線
+#ファイルパス
+scraping_idebate/src/scraping_tqdm.py
+------------
+import requests
+from bs4 import BeautifulSoup
+import json
+import os
+import sys
+from urllib.parse import urlparse
+from tqdm import tqdm
+def scrape_url(url, output_dir):
+    response = requests.get(url)
+    response.raise_for_status()
+    soup = BeautifulSoup(response.content, 'html.parser')
+    topic = soup.find("h1", class_="blog-post__title").get_text(strip=True)
+    points_list = []
+    def extract_points(section, section_name):
+        accordion_items = section.find_next_sibling('div', class_='accordion').find_all('div', class_='accordion__item')
+        for item in accordion_items:
+            point_subtitle = item.find('h4', class_='accordion__subtitle').get_text().strip()
+            point_body = item.find('div', class_='accordion__body').find('p').get_text().strip()
+            points_list.append({
+                "topic": topic,
+                "section": section_name,
+                "context": f"**{point_subtitle}**\n{point_body}"
+            })
+    points_for_section = soup.find('div', class_='points-vote points-vote--for')
+    if points_for_section:
+        extract_points(points_for_section, "Points For")
+    points_against_section = soup.find('div', class_='points-vote points-vote--against')
+    if points_against_section:
+        extract_points(points_against_section, "Points Against")
+    # Generate a unique filename based on the URL
+    parsed_url = urlparse(url)
+    filename = f"{parsed_url.path.strip('/').replace('/', '_')}.json"
+    output_path = os.path.join(output_dir, filename)
+    with open(output_path, "w", encoding="utf-8") as f:
+        json.dump(points_list, f, ensure_ascii=False, indent=4)
+    return output_path
+if __name__ == "__main__":
+    if len(sys.argv) != 3:
+        print("Usage: python script.py <json_file> <output_dir>")
+        sys.exit(1)
+    json_file = sys.argv[1]
+    output_dir = sys.argv[2]
+    os.makedirs(output_dir, exist_ok=True)
+    with open(json_file, 'r') as f:
+        url_data = json.load(f)
+    total_urls = sum(len(urls) for urls in url_data.values())
+    with tqdm(total=total_urls, desc="Scraping Progress") as pbar:
+        for category, urls in url_data.items():
+            for url in urls:
+                try:
+                    output_path = scrape_url(url, output_dir)
+                    pbar.set_postfix_str(f"Saved: {output_path}")
+                    pbar.update(1)
+                except Exception as e:
+                    pbar.set_postfix_str(f"Error: {url}")
+                    print(f"\nError scraping {url}: {str(e)}")
+                    pbar.update(1)
+    print("\nScraping completed. All data saved to the output directory.")

rquirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+streamlit>=1.24.0
+openai>=0.27.0
+pathlib>=1.0.1
+chardet>=4.0.0

scan.sh ADDED Viewed

	@@ -0,0 +1,49 @@

+#!/bin/bash
+# Scan a GitHub repository or a local directory with main.py.
+# Usage: ./scan.sh [github_url | directory_path]
+# Stop on any unhandled command failure.
+set -e
+# Target to scan: the first argument if given, otherwise the default below.
+# Change the default here to scan a different target without arguments.
+DEFAULT_TARGET_PATH="https://github.com/DeL-TaiseiOzaki/idebate_scraping.git"
+# DEFAULT_TARGET_PATH="/path/to/your/directory"  # example: a local directory
+TARGET_PATH="${1:-$DEFAULT_TARGET_PATH}"
+# Make sure the output directory exists.
+mkdir -p output
+# Check that Python is available.
+if ! command -v python3 &> /dev/null; then
+    echo "Error: Python3 is not installed"
+    exit 1
+fi
+# For a GitHub repository, check that Git is available.
+if [[ $TARGET_PATH == http* ]] && [[ $TARGET_PATH == *github.com* ]]; then
+    if ! command -v git &> /dev/null; then
+        echo "Error: Git is not installed"
+        exit 1
+    fi
+    echo "Scanning GitHub repository: $TARGET_PATH"
+else
+    if [ ! -d "$TARGET_PATH" ]; then
+        echo "Error: Directory not found: $TARGET_PATH"
+        exit 1
+    fi
+    echo "Scanning local directory: $TARGET_PATH"
+fi
+# Run the scan. The call sits inside the `if` so that `set -e` does not abort
+# the script before the failure branch can report the exit code.
+echo "Starting directory scan..."
+if python3 main.py "$TARGET_PATH"; then
+    echo "Scan completed successfully!"
+    echo "Results are saved in the 'output' directory"
+else
+    exit_code=$?
+    echo "Scan failed with exit code: $exit_code"
+    exit "$exit_code"
+fi

services/llm_service.py ADDED Viewed

	@@ -0,0 +1,78 @@

+from typing import Optional
+import openai
+from pathlib import Path
+class LLMService:
+    def __init__(self, api_key: str):
+        """
+        LLMサービスの初期化
+        Args:
+            api_key: OpenAI APIキー
+        """
+        self.api_key = api_key
+        openai.api_key = api_key
+    def create_prompt(self, content: str, query: str) -> str:
+        """
+        プロンプトを生成
+        Args:
+            content: コードの内容
+            query: ユーザーからの質問
+        Returns:
+            生成されたプロンプト
+        """
+        return f"""以下はGitHubリポジトリのコード解析結果です。このコードについて質問に答えてください。
+コード解析結果:
+{content}
+質問: {query}
+できるだけ具体的に、コードの内容を参照しながら回答してください。"""
+    def get_response(self, content: str, query: str) -> tuple[str, Optional[str]]:
+        """
+        LLMを使用して回答を生成
+        Args:
+            content: コードの内容
+            query: ユーザーからの質問
+        Returns:
+            (回答, エラーメッセージ)のタプル
+        """
+        try:
+            prompt = self.create_prompt(content, query)
+            response = openai.ChatCompletion.create(
+                model="gpt-3.5-turbo-16k",
+                messages=[
+                    {
+                        "role": "system",
+                        "content": "あなたはコードアナリストとして、リポジトリの解析と質問への回答を行います。"
+                    },
+                    {
+                        "role": "user",
+                        "content": prompt
+                    }
+                ]
+            )
+            return response.choices[0].message.content, None
+        except Exception as e:
+            return None, f"エラーが発生しました: {str(e)}"
+    @staticmethod
+    def format_code_content(files_content: dict) -> str:
+        """
+        ファイル内容をプロンプト用にフォーマット
+        Args:
+            files_content: ファイルパスと内容の辞書
+        Returns:
+            フォーマットされたテキスト
+        """
+        formatted_content = []
+        for file_path, content in files_content.items():
+            formatted_content.append(
+                f"#ファイルパス\n{file_path}\n------------\n{content}\n"
+            )
+        return "\n".join(formatted_content)

utils/__init__.py ADDED Viewed

File without changes

utils/__pycache__/__init__.cpython-310.pyc ADDED Viewed

Binary file (152 Bytes). View file

utils/__pycache__/content_exporter.cpython-310.pyc ADDED Viewed

Binary file (2.36 kB). View file

utils/__pycache__/file_writer.cpython-310.pyc ADDED Viewed

Binary file (1.13 kB). View file

utils/file_writer.py ADDED Viewed

	@@ -0,0 +1,24 @@

+from pathlib import Path
+from typing import List
+from core.file_scanner import FileInfo
+class FileWriter:
+    def __init__(self, output_file: Path):
+        self.output_file = output_file
+    def write_contents(self, files: List[FileInfo]) -> None:
+        self.output_file.parent.mkdir(parents=True, exist_ok=True)
+        with self.output_file.open('w', encoding='utf-8') as f:
+            for file_info in files:
+                # ファイルパスのセクション
+                f.write("#ファイルパス\n")
+                f.write(str(file_info.path))
+                f.write("\n------------\n")
+                # ファイル内容
+                if file_info.content is not None:
+                    f.write(file_info.content)
+                else:
+                    f.write("# Failed to read content")
+                f.write("\n\n")

utils/logger.py ADDED Viewed

	@@ -0,0 +1,26 @@

+from pathlib import Path
+from typing import List
+from datetime import datetime
+from core.file_scanner import FileInfo
+class ScanLogger:
+    def __init__(self, log_file: Path):
+        self.log_file = log_file
+    def write_log(self, repo_url: str, files: List[FileInfo], stats: dict):
+        """スキャン結果をログファイルに書き込みます"""
+        self.log_file.parent.mkdir(parents=True, exist_ok=True)
+        with self.log_file.open('w', encoding='utf-8') as f:
+            f.write(f"スキャン日時: {datetime.now()}\n")
+            f.write(f"リポジトリ: {repo_url}\n")
+            f.write(f"ファイル数: {len(files)}\n\n")
+            f.write("=== ファイル種類の統計 ===\n")
+            for ext, count in stats.items():
+                f.write(f"{ext}: {count}個\n")
+            f.write("\n")
+            f.write("=== ファイルパス一覧 ===\n")
+            for file_info in files:
+                f.write(f"{file_info.path} ({file_info.formatted_size})\n")