cyclotruc · AbhiRam162105 · Jan 21, 2025 · Jan 23, 2025 · Jan 24, 2025 · Jan 25, 2025
diff --git a/src/gitingest/cli.py b/src/gitingest/cli.py
@@ -1,100 +1,173 @@
-""" Command-line interface for the Gitingest package. """
+"""Command-line interface for the Gitingest package."""
 
 # pylint: disable=no-value-for-parameter
-
 import asyncio
+from pathlib import Path
 
 import click
 
 from gitingest.config import MAX_FILE_SIZE, OUTPUT_FILE_PATH
 from gitingest.repository_ingest import ingest
 
 
+def parse_ignore_file(ignore_file_path: Path) -> set[str]:
+    """
+    Parse the .gitingestignore file and return a set of patterns to ignore.
+
+    Parameters
+    ----------
+    ignore_file_path : Path
+        Path to the ignore file. A path that is not an existing regular file yields no patterns.
+
+    Returns
+    -------
+    set[str]
+        Stripped, non-empty lines of the file that do not start with "#".
+    """
+    if not ignore_file_path.is_file():
+        return set()
+
+    with open(ignore_file_path, encoding="utf-8") as f:
+        # Strip each line first so indented "#" comments are skipped too.
+        stripped_lines = (line.strip() for line in f)
+        patterns = {entry for entry in stripped_lines if entry and not entry.startswith("#")}
+    return patterns
+
+
+def parse_patterns(patterns: tuple[str, ...]) -> set[str]:
+    """
+    Collect the individual patterns given on the command line.
+
+    Each -e/-i value may itself hold several whitespace-separated patterns;
+    all of them are flattened into one de-duplicated set.
+
+    Parameters
+    ----------
+    patterns : tuple[str, ...]
+        Raw option values as received from the command line.
+
+    Returns
+    -------
+    set[str]
+        Every whitespace-delimited token found in the given values.
+    """
+    # str.split() without arguments never produces empty or padded tokens,
+    # so no additional stripping or emptiness check is required here.
+    tokens = (token for raw_value in patterns for token in raw_value.split())
+    return set(tokens)
+
+
 @click.command()
 @click.argument("source", type=str, default=".")
 @click.option("--output", "-o", default=None, help="Output file path (default: <repo_name>.txt in current directory)")
 @click.option("--max-size", "-s", default=MAX_FILE_SIZE, help="Maximum file size to process in bytes")
-@click.option("--exclude-pattern", "-e", multiple=True, help="Patterns to exclude")
-@click.option("--include-pattern", "-i", multiple=True, help="Patterns to include")
+@click.option("--exclude-pattern", "-e", multiple=True, help="Patterns to exclude (space-separated patterns allowed)")
+@click.option("--include-pattern", "-i", multiple=True, help="Patterns to include (space-separated patterns allowed)")
+@click.option("--ignore-file", default=".gitingestignore", help="Path to ignore file (default: .gitingestignore)")
 def main(
     source: str,
     output: str | None,
     max_size: int,
     exclude_pattern: tuple[str, ...],
     include_pattern: tuple[str, ...],
+    ignore_file: str,
 ):
     """
-    Main entry point for the CLI. This function is called when the CLI is run as a script.
-
-    It calls the async main function to run the command.
+    Main entry point for the CLI; runs the async_main coroutine to completion via asyncio.run.
 
     Parameters
     ----------
     source : str
         The source directory or repository to analyze.
     output : str | None
-        The path where the output file will be written. If not specified, the output will be written
-        to a file named `<repo_name>.txt` in the current directory.
+        The path where the output file will be written. If not specified, the output
+        will be written to a file named `<repo_name>.txt` in the current directory.
     max_size : int
         The maximum file size to process, in bytes. Files larger than this size will be ignored.
     exclude_pattern : tuple[str, ...]
         A tuple of patterns to exclude during the analysis. Files matching these patterns will be ignored.
     include_pattern : tuple[str, ...]
         A tuple of patterns to include during the analysis. Only files matching these patterns will be processed.
+    ignore_file : str
+        Path to the ignore file containing additional patterns to exclude; forwarded to async_main.
     """
-    # Main entry point for the CLI. This function is called when the CLI is run as a script.
-    asyncio.run(_async_main(source, output, max_size, exclude_pattern, include_pattern))
+    asyncio.run(async_main(source, output, max_size, exclude_pattern, include_pattern, ignore_file))
 
 
-async def _async_main(
+async def async_main(
     source: str,
     output: str | None,
     max_size: int,
     exclude_pattern: tuple[str, ...],
     include_pattern: tuple[str, ...],
+    ignore_file: str,
 ) -> None:
     """
     Analyze a directory or repository and create a text dump of its contents.
 
-    This command analyzes the contents of a specified source directory or repository, applies custom include and
-    exclude patterns, and generates a text summary of the analysis which is then written to an output file.
+    This command analyzes the contents of a specified source directory or repository,
+    applies custom include and exclude patterns, and generates a text summary of the
+    analysis which is then written to an output file.
 
     Parameters
     ----------
     source : str
         The source directory or repository to analyze.
     output : str | None
-        The path where the output file will be written. If not specified, the output will be written
-        to a file named `<repo_name>.txt` in the current directory.
+        The path where the output file will be written. If not specified, the output
+        will be written to a file named `<repo_name>.txt` in the current directory.
     max_size : int
         The maximum file size to process, in bytes. Files larger than this size will be ignored.
     exclude_pattern : tuple[str, ...]
         A tuple of patterns to exclude during the analysis. Files matching these patterns will be ignored.
     include_pattern : tuple[str, ...]
         A tuple of patterns to include during the analysis. Only files matching these patterns will be processed.
+    ignore_file : str
+        Path to the ignore file, joined onto `source`, containing additional patterns to exclude.
 
     Raises
     ------
     Abort
         If there is an error during the execution of the command, this exception is raised to abort the process.
     """
     try:
-        # Combine default and custom ignore patterns
-        exclude_patterns = set(exclude_pattern)
-        include_patterns = set(include_pattern)
+        # Get repository name from source path
+        repo_name = Path(source).name or "repository"
 
+        # Set default output filename if not provided
         if not output:
-            output = OUTPUT_FILE_PATH
-        summary, _, _ = await ingest(source, max_size, include_patterns, exclude_patterns, output=output)
+            output = f"{repo_name}.txt"
 
+        # Parse command line patterns
+        exclude_patterns = parse_patterns(exclude_pattern)
+        include_patterns = parse_patterns(include_pattern)
+
+        # Read and add patterns from ignore file
+        ignore_file_path = Path(source) / ignore_file
+        ignore_patterns = parse_ignore_file(ignore_file_path)
+        exclude_patterns.update(ignore_patterns)
+
+        # Perform the ingest operation
+        summary, *_ = await ingest(source, max_size, include_patterns, exclude_patterns, output=output)
+
+        # Display results
         click.echo(f"Analysis complete! Output written to: {output}")
         click.echo("\nSummary:")
         click.echo(summary)
 
-    except Exception as e:
-        click.echo(f"Error: {e}", err=True)
+    except FileNotFoundError as e:
+        click.echo(f"Error: Source directory not found - {e}", err=True)
+        raise click.Abort()
+    except PermissionError as e:
+        click.echo(f"Error: Permission denied - {e}", err=True)
         raise click.Abort()
+    except Exception as e:
+        # Any other failure means the ingest did not finish, so abort with a
+        # non-zero exit status as the docstring promises. Returning here would
+        # let the CLI exit 0 and scripts would mistake the failure for success.
+        click.echo(f"Error: {e}", err=True)
+        raise click.Abort()
 
 
 if __name__ == "__main__":
-    main()
+    main()