diff --git a/.cursorrules b/.cursor/index.mdc similarity index 95% rename from .cursorrules rename to .cursor/index.mdc index 3ebccca..5b9200b 100644 --- a/.cursorrules +++ b/.cursor/index.mdc @@ -1,3 +1,7 @@ +--- +alwaysApply: true +--- + # repo-to-text ## Project Overview diff --git a/AGENTS.md b/AGENTS.md new file mode 120000 index 0000000..94443be --- /dev/null +++ b/AGENTS.md @@ -0,0 +1 @@ +.cursor/index.mdc \ No newline at end of file diff --git a/CLAUDE.md b/CLAUDE.md new file mode 120000 index 0000000..94443be --- /dev/null +++ b/CLAUDE.md @@ -0,0 +1 @@ +.cursor/index.mdc \ No newline at end of file diff --git a/pyproject.toml b/pyproject.toml index 19e9e99..ff44c8d 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -4,7 +4,7 @@ build-backend = "hatchling.build" [project] name = "repo-to-text" -version = "0.7.0" +version = "0.8.0" authors = [ { name = "Kirill Markin", email = "markinkirill@gmail.com" }, ] diff --git a/repo_to_text/core/core.py b/repo_to_text/core/core.py index 6dfcda9..ccc9460 100644 --- a/repo_to_text/core/core.py +++ b/repo_to_text/core/core.py @@ -4,6 +4,7 @@ Core functionality for repo-to-text import os import subprocess +import platform from typing import Tuple, Optional, List, Dict, Any, Set from datetime import datetime, timezone from importlib.machinery import ModuleSpec @@ -36,12 +37,20 @@ def get_tree_structure( def run_tree_command(path: str) -> str: """Run the tree command and return its output.""" + if platform.system() == "Windows": + cmd = ["cmd", "/c", "tree", "/a", "/f", path] + else: + cmd = ["tree", "-a", "-f", "--noreport", path] + result = subprocess.run( - ['tree', '-a', '-f', '--noreport', path], + cmd, stdout=subprocess.PIPE, + stderr=subprocess.PIPE, + text=True, + encoding='utf-8', check=True ) - return result.stdout.decode('utf-8') + return result.stdout def filter_tree_output( tree_output: str, @@ -343,6 +352,33 @@ def save_repo_to_text( return output_filepaths[0] return "" +def _read_file_content(file_path: str) -> str: + """Read file content, handling binary files and broken symlinks. + + Args: + file_path: Path to the file to read + + Returns: + str: File content or appropriate message for special cases + """ + try: + with open(file_path, 'r', encoding='utf-8') as f: + return f.read() + except UnicodeDecodeError: + logging.debug('Handling binary file contents: %s', file_path) + with open(file_path, 'rb') as f_bin: + binary_content: bytes = f_bin.read() + return binary_content.decode('latin1') + except FileNotFoundError as e: + # Minimal handling for bad symlinks + if os.path.islink(file_path) and not os.path.exists(file_path): + try: + target = os.readlink(file_path) + except OSError: + target = '' + return f"[symlink] -> {target}" + raise e + def generate_output_content( path: str, @@ -417,17 +453,8 @@ def generate_output_content( cleaned_relative_path = relative_path.replace('./', '', 1) _add_chunk_to_output(f'\n\n') - - try: - with open(file_path, 'r', encoding='utf-8') as f: - file_content = f.read() - _add_chunk_to_output(file_content) - except UnicodeDecodeError: - logging.debug('Handling binary file contents: %s', file_path) - with open(file_path, 'rb') as f_bin: - binary_content: bytes = f_bin.read() - _add_chunk_to_output(binary_content.decode('latin1')) # Add decoded binary - + file_content = _read_file_content(file_path) + _add_chunk_to_output(file_content) _add_chunk_to_output('\n\n') _add_chunk_to_output('\n\n')