Source code for tzst.cli

Name: tzst
Rating: 5 (1 reviews)
Author: Xi Xu
"""Command-line interface for tzst."""

import argparse
import json
import sys
from pathlib import Path
from typing import Any, Literal, cast

from . import __version__
from .core import (
    ConflictResolution,
    create_archive,
    extract_archive,
    list_archive,
    test_archive,
)
from .exceptions import TzstArchiveError, TzstDecompressionError


def _normalize_archive_path(archive_path: Path) -> Path:
    """Return the archive path with the extension the CLI reports to the user.

    The in-file comments state that this mirrors the extension handling in
    core.py's create_archive, so the CLI can display the final filename.

    Rules applied (suffix comparison is case-insensitive):
        * ``.tzst`` or ``.zst``  -> returned unchanged
        * ``.tar``               -> suffix replaced with ``.tar.zst``
        * anything else          -> ``.tzst`` appended to the existing suffix

    Args:
        archive_path: Archive path as supplied by the caller.

    Returns:
        Path: Path carrying a recognised archive extension.
    """
    # Accept anything Path() accepts, not only Path instances.
    candidate = Path(archive_path)
    original_suffix = candidate.suffix
    lowered = original_suffix.lower()

    # Already a recognised archive extension: nothing to do.
    if lowered in (".tzst", ".zst"):
        return candidate

    # A plain tarball name gets the compound zstd extension.
    if lowered == ".tar":
        return candidate.with_suffix(".tar.zst")

    # Keep whatever suffix was there (possibly none) and append ".tzst".
    return candidate.with_suffix(original_suffix + ".tzst")


def _interactive_conflict_callback(target_path: Path) -> ConflictResolution:
    """Ask the user on the terminal how to resolve one file conflict.

    Prints a menu, then keeps prompting until a valid letter is entered.
    Input is stripped and upper-cased before being matched.

    Args:
        target_path: Path of the file that already exists.

    Returns:
        ConflictResolution: The action selected by the user. EOF or Ctrl+C
        at the prompt is treated as a request to exit.
    """
    menu_lines = (
        f"\nFile already exists: {target_path}",
        "Choose an action:",
        "  [R] Replace",
        "  [N] Do not replace (skip)",
        "  [A] Replace all",
        "  [S] Skip all",
        "  [U] Auto-rename all",
        "  [X] Exit",
    )
    for menu_line in menu_lines:
        print(menu_line)

    # Menu letter -> resolution returned to the extraction code.
    actions = {
        "R": ConflictResolution.REPLACE,
        "N": ConflictResolution.SKIP,
        "A": ConflictResolution.REPLACE_ALL,
        "S": ConflictResolution.SKIP_ALL,
        "U": ConflictResolution.AUTO_RENAME_ALL,
        "X": ConflictResolution.EXIT,
    }

    while True:
        try:
            answer = input("Enter choice [R/N/A/S/U/X]: ").strip().upper()
            if answer in actions:
                return actions[answer]
            print("Invalid choice. Please enter R, N, A, S, U, or X.")
        except (EOFError, KeyboardInterrupt):
            # Closed stdin or Ctrl+C: stop asking and abort the operation.
            print("\nOperation cancelled by user")
            return ConflictResolution.EXIT



[docs]
def print_banner() -> None:
    """Write the version/copyright banner to stdout.

    The banner is a single line containing the package version and the
    copyright notice, surrounded by one blank line above and below.

    Returns:
        None
    """
    banner_lines = ("", f"tzst {__version__} : Copyright (c) Xi Xu", "")
    for banner_line in banner_lines:
        print(banner_line)



def _wants_json_output(args) -> bool:
    """Tell whether machine-readable (JSON) output was requested.

    Args:
        args: Parsed arguments object; a missing ``json_output`` attribute
            counts as "not requested".

    Returns:
        bool: True when ``args.json_output`` is truthy, otherwise False.
    """
    requested = getattr(args, "json_output", False)
    return True if requested else False


def _emit_json(payload: dict[str, Any], *, to_stderr: bool = False) -> None:
    """Serialize *payload* as one line of JSON and print it.

    Non-ASCII characters are escaped (``ensure_ascii=True``).

    Args:
        payload: Mapping to serialize.
        to_stderr: When True the line goes to stderr instead of stdout.
    """
    encoded = json.dumps(payload, ensure_ascii=True)
    if to_stderr:
        print(encoded, file=sys.stderr)
    else:
        print(encoded, file=sys.stdout)


def _emit_error(
    args,
    message: str,
    *,
    error_type: str,
    exit_code: int = 1,
    details: dict[str, Any] | None = None,
) -> int:
    """Report an error on stderr and hand back the exit code to use.

    In JSON mode a ``{"ok": false, "error": {...}}`` object is written;
    otherwise the plain message is printed.

    Args:
        args: Parsed arguments, consulted for the JSON-output flag.
        message: Human-readable error text.
        error_type: Machine-readable error identifier (JSON mode only).
        exit_code: Value returned to the caller unchanged.
        details: Optional extra data; included in the JSON error object
            only when non-empty.

    Returns:
        int: ``exit_code``.
    """
    if not _wants_json_output(args):
        print(message, file=sys.stderr)
        return exit_code

    error_body: dict[str, Any] = {"type": error_type, "message": message}
    if details:
        error_body["details"] = details
    _emit_json({"ok": False, "error": error_body}, to_stderr=True)
    return exit_code


def _summarize_listing(contents: list[dict[str, Any]]) -> dict[str, int | str]:
    """Compute the totals shown after an archive listing.

    Entries flagged ``is_file`` are counted as files and contribute their
    ``size``; other entries flagged ``is_dir`` are counted as directories.
    Entries that are neither are ignored.

    Args:
        contents: Archive entries as dictionaries.

    Returns:
        dict: File count, directory count, total size in bytes, and the
        same size formatted by ``format_size``.
    """
    file_count = 0
    dir_count = 0
    byte_total = 0

    for entry in contents:
        if entry["is_file"]:
            file_count += 1
            byte_total += entry["size"]
            continue
        if entry["is_dir"]:
            dir_count += 1

    summary: dict[str, int | str] = {}
    summary["files"] = file_count
    summary["directories"] = dir_count
    summary["total_size_bytes"] = byte_total
    summary["total_size_human"] = format_size(byte_total)
    return summary


def _should_print_banner(argv: list[str] | None) -> bool:
    """Determine whether the human-facing banner should be displayed."""
    cli_args = argv if argv is not None else sys.argv[1:]
    return "--json" not in cli_args and "--no-banner" not in cli_args



[docs]
def format_size(size: int) -> str:
    """Render a byte count using binary units (B, KB, MB, GB, TB, PB).

    The value is divided by 1024 until it drops below 1024 or the largest
    unit (PB) is reached. The number is formatted with one decimal place
    and right-aligned in a field six characters wide.

    Args:
        size (int): Size in bytes.

    Returns:
        str: Padded number, a space, and the unit.

    Examples:
        >>> format_size(1024)
        '   1.0 KB'
        >>> format_size(1536)
        '   1.5 KB'
        >>> format_size(2048576)
        '   2.0 MB'
    """
    unit_labels = ("B", "KB", "MB", "GB", "TB", "PB")
    largest = len(unit_labels) - 1

    scaled = float(size)
    position = 0
    # Step up one unit at a time; PB is the ceiling and is never divided.
    while position < largest and not scaled < 1024.0:
        scaled /= 1024.0
        position += 1

    return f"{scaled:6.1f} {unit_labels[position]}"




[docs]
def validate_compression_level(value: str) -> int:
    """Parse and range-check a compression level given on the command line.

    Args:
        value: Raw string from the command line.

    Returns:
        int: The level, guaranteed to be within 1-22 inclusive.

    Raises:
        argparse.ArgumentTypeError: If *value* is not an integer or lies
            outside 1-22.
    """
    try:
        parsed = int(value)
    except ValueError:
        # "from None" hides the int() traceback from the argparse message.
        raise argparse.ArgumentTypeError(
            f"Invalid compression level: '{value}'. "
            f"Must be an integer between 1 and 22."
        ) from None

    if parsed < 1 or parsed > 22:
        raise argparse.ArgumentTypeError(
            f"Invalid compression level: {parsed}. Must be between 1 and 22."
        )
    return parsed



def _process_file_paths(file_args: list[str]) -> list[Path]:
    """Turn command-line file arguments into resolved paths.

    Args:
        file_args: File path strings from the command line.

    Returns:
        list[Path]: One ``Path(...).resolve()`` result per argument, in the
        same order.
    """
    return [Path(raw_argument).resolve() for raw_argument in file_args]


def _validate_files(files: list[Path]) -> list[Path]:
    """Find which of the given paths do not exist.

    Args:
        files: Paths to check.

    Returns:
        list[Path]: The paths that are missing, in input order (empty when
        every path exists).

    Raises:
        OSError: Re-raised if checking a path fails; a message naming the
            path is printed to stderr first.
    """
    absent: list[Path] = []
    for candidate in files:
        try:
            present = candidate.exists()
        except OSError as exc:
            # Report which path could not be checked, then let the caller
            # decide how to exit.
            print(f"Error: Cannot access file '{candidate}' - {exc}", file=sys.stderr)
            raise
        if not present:
            absent.append(candidate)
    return absent


def _extract_add_params(args) -> tuple[int, bool]:
    """Read the archive-creation options from the parsed arguments.

    Args:
        args: Parsed command line arguments.

    Returns:
        tuple[int, bool]: ``(compression_level, use_temp_file)``. The level
        defaults to 3 when absent; ``use_temp_file`` is the negation of the
        ``no_atomic`` flag (absent means atomic writes stay enabled).
    """
    return (
        getattr(args, "compression_level", 3),
        not getattr(args, "no_atomic", False),
    )


def _prepare_archive_creation(args) -> tuple[Path, list[Path], int, bool] | int:
    """Collect and validate everything needed to create an archive.

    Args:
        args: Parsed command line arguments (``archive`` and ``files`` are
            read directly; creation options via ``_extract_add_params``).

    Returns:
        tuple or int: ``(archive_path, files, compression_level,
        use_temp_file)`` when all input files exist, otherwise the exit code
        returned by ``_emit_error`` after reporting the missing files.
    """
    archive_path = Path(args.archive)
    input_paths = _process_file_paths(args.files)

    not_found = _validate_files(input_paths)
    if not not_found:
        level, atomic = _extract_add_params(args)
        return archive_path, input_paths, level, atomic

    # At least one input is missing: report all of them at once.
    not_found_names = [str(path) for path in not_found]
    return _emit_error(
        args,
        f"Error: Files not found - {', '.join(not_found_names)}",
        error_type="files_not_found",
        details={"missing_files": not_found_names},
    )


def _execute_archive_creation(
    args,
    archive_path: Path,
    files: list[Path],
    compression_level: int,
    use_temp_file: bool,
) -> int:
    """Create the archive and report progress/result.

    Args:
        args: Parsed command line arguments, consulted for the JSON flag.
        archive_path: Path where the archive will be created.
        files: Files to add to the archive.
        compression_level: Compression level passed to ``create_archive``.
        use_temp_file: Forwarded to ``create_archive`` as ``use_temp_file``;
            per the original comments this selects atomic creation via a
            temporary file.

    Returns:
        int: 0 on success. Failures surface as exceptions from
        ``create_archive``.
    """
    # Path with the final extension, used only for display/reporting.
    shown_path = _normalize_archive_path(archive_path)
    json_mode = _wants_json_output(args)

    if not json_mode:
        print(f"Creating archive: {shown_path}")
        for member in files:
            print(f"  Adding: {member}")

    # The un-normalized path is handed over; create_archive is said to apply
    # the same extension rules itself.
    create_archive(archive_path, files, compression_level, use_temp_file=use_temp_file)

    if not json_mode:
        print(f"Archive created successfully - {shown_path}")
        return 0

    report = {
        "ok": True,
        "command": "add",
        "archive": str(archive_path),
        "normalized_archive": str(shown_path),
        "added": [str(member) for member in files],
        "compression_level": compression_level,
        "atomic": use_temp_file,
    }
    _emit_json(report)
    return 0


def _handle_archive_creation_exceptions(command_args, func, *args, **kwargs) -> int:
    """Run *func* and translate any exception into a reported exit code.

    Args:
        command_args: Parsed command line arguments; passed to
            ``_emit_error`` so errors honour the JSON/text output mode.
        func: Function to execute.
        *args: Positional arguments for func.
        **kwargs: Keyword arguments for func.

    Returns:
        int: Whatever *func* returns on success; otherwise 130 for
        KeyboardInterrupt and 1 for every other handled exception.
    """
    try:
        return func(*args, **kwargs)
    except OSError as e:
        # Always report OSError. It can come from the archive-writing step
        # as well as from _validate_files, and in JSON mode _validate_files
        # only prints plain text. Returning 1 silently here would leave the
        # user (or a JSON consumer) with no explanation. On the
        # _validate_files path this adds a second line to stderr.
        return _emit_error(
            command_args,
            f"Error: File system operation failed - {e}",
            error_type="os_error",
        )
    except ValueError as e:
        return _emit_error(
            command_args,
            f"Error: Invalid parameter - {e}",
            error_type="invalid_parameter",
        )
    except TzstArchiveError as e:
        return _emit_error(
            command_args,
            f"Error: Archive operation failed - {e}",
            error_type="archive_operation_failed",
        )
    except KeyboardInterrupt:
        # No cleanup of partial files is done here; per the original note,
        # the atomic operations in create_archive handle that.
        return _emit_error(
            command_args,
            "Operation interrupted by user",
            error_type="interrupted",
            exit_code=130,
        )
    except Exception as e:
        return _emit_error(
            command_args,
            f"Error: Failed to create archive - {e}",
            error_type="create_failed",
        )



[docs]
def cmd_add(args) -> int:
    """Command handler that creates an archive from the given files.

    Validates the inputs, creates the archive, and maps any exception to an
    exit code via ``_handle_archive_creation_exceptions``.

    Args:
        args: Parsed command line arguments containing:
            - archive (str): Path to the archive file to create
            - files (list[str]): Files/directories to add
            - compression_level (int, optional): Compression level
              (defaults to 3 when absent)
            - no_atomic (bool, optional): Disable use of a temporary file
              during creation

    Returns:
        int: Exit code
            - 0: Success
            - 1: Missing input files or any handled error
            - 130: Interrupted by the user (Ctrl+C)

    See Also:
        :func:`tzst.create_archive`: The underlying function for archive creation
    """

    def _run() -> int:
        prepared = _prepare_archive_creation(args)
        # An int here is an exit code: validation already reported the error.
        if isinstance(prepared, int):
            return prepared

        target, inputs, level, atomic = prepared
        return _execute_archive_creation(args, target, inputs, level, atomic)

    return _handle_archive_creation_exceptions(args, _run)




[docs]
def cmd_extract_full(args) -> int:
    """Command handler for extraction that keeps the directory structure.

    Calls ``extract_archive`` with ``flatten=False``.

    Args:
        args: Parsed command line arguments containing:
            - archive (str): Path to the archive file to extract
            - output (str, optional): Output directory (default: current
              working directory)
            - files (list[str], optional): Specific members to extract
            - streaming (bool, optional): Forwarded to ``extract_archive``
            - filter (str, optional): Extraction filter; defaults to "data"
            - conflict_resolution (str, optional): Name of a
              ``ConflictResolution`` value; defaults to "ask"
            - interactive (bool, optional): Forces "ask" when set
            - json_output (bool, optional): Emit JSON instead of text

    Returns:
        int: Exit code
            - 0: Success
            - 1: Archive missing, JSON mode combined with interactive
              prompts, or any handled error
            - 130: Interrupted by the user (Ctrl+C)

    See Also:
        :func:`tzst.extract_archive`: The underlying function for extraction
        :func:`cmd_extract_flat`: For flat extraction without directory structure
    """
    try:
        source = Path(args.archive)
        if not source.exists():
            return _emit_error(
                args,
                f"Error: Archive not found - {source}",
                error_type="archive_not_found",
                details={"archive": str(source)},
            )

        destination = Path(args.output) if args.output else Path.cwd()
        # An empty or absent member list means "extract everything".
        selected = getattr(args, "files", None) or None
        use_streaming = getattr(args, "streaming", False)
        extraction_filter = cast(
            Literal["data", "tar", "fully_trusted"], getattr(args, "filter", "data")
        )

        # --interactive wins over whatever --conflict-resolution says.
        if getattr(args, "interactive", False):
            policy_name = "ask"
        else:
            policy_name = getattr(args, "conflict_resolution", "ask")
        policy = ConflictResolution(policy_name)

        json_mode = _wants_json_output(args)
        needs_prompt = policy == ConflictResolution.ASK

        # Prompts would interleave with the JSON stream, so refuse up front.
        if json_mode and needs_prompt:
            return _emit_error(
                args,
                "Error: JSON mode does not support interactive conflict prompts",
                error_type="interactive_conflict_not_supported",
            )

        prompt = _interactive_conflict_callback if needs_prompt else None

        if not json_mode:
            print(f"Extracting from: {source}")
            print(f"Output directory: {destination}")
            if use_streaming:
                print("Using streaming mode (memory efficient)")
            if extraction_filter != "data":
                print(f"Using security filter: {extraction_filter}")
            if policy != ConflictResolution.REPLACE:
                print(f"Conflict resolution: {policy.value}")

        extract_archive(
            source,
            destination,
            selected,
            flatten=False,
            streaming=use_streaming,
            filter=extraction_filter,
            conflict_resolution=policy,
            interactive_callback=prompt,
        )

        if not json_mode:
            print("Extraction completed successfully")
            return 0

        _emit_json(
            {
                "ok": True,
                "command": "extract",
                "archive": str(source),
                "output_dir": str(destination),
                "members": selected or [],
                "flatten": False,
                "streaming": use_streaming,
                "filter": extraction_filter,
                "conflict_resolution": policy.value,
            }
        )
        return 0

    except FileNotFoundError as exc:
        return _emit_error(
            args,
            f"Error: File not found - {exc}",
            error_type="file_not_found",
        )
    except TzstDecompressionError as exc:
        return _emit_error(
            args,
            f"Error: Archive decompression failed - {exc}",
            error_type="decompression_failed",
        )
    except TzstArchiveError as exc:
        return _emit_error(
            args,
            f"Error: Archive operation failed - {exc}",
            error_type="archive_operation_failed",
        )
    except KeyboardInterrupt:
        return _emit_error(
            args,
            "Operation interrupted by user",
            error_type="interrupted",
            exit_code=130,
        )
    except Exception as exc:
        return _emit_error(
            args,
            f"Error: Failed to extract archive - {exc}",
            error_type="extract_failed",
        )




[docs]
def cmd_extract_flat(args) -> int:
    """Command handler for flat extraction without directory structure.

    Calls ``extract_archive`` with ``flatten=True`` so that all files are
    extracted into a single directory.

    Args:
        args: Parsed command line arguments containing:
            - archive (str): Path to the archive file to extract
            - output (str, optional): Output directory (default: current
              working directory)
            - files (list[str], optional): Specific files to extract
            - streaming (bool, optional): Forwarded to ``extract_archive``
            - filter (str, optional): Security filter ('data', 'tar',
              'fully_trusted'); defaults to 'data'
            - conflict_resolution (str, optional): Name of a
              ``ConflictResolution`` value; defaults to "ask"
            - interactive (bool, optional): Forces "ask" when set
            - json_output (bool, optional): Emit JSON instead of text

    Returns:
        int: Exit code (0 for success, non-zero for failure)
            - 0: Success
            - 1: File not found, decompression failed, JSON mode combined
              with interactive prompts, or archive operation failed
            - 130: Operation interrupted by user (Ctrl+C)

    Warning:
        Flat extraction may cause filename conflicts if multiple files have
        the same name but are in different directories within the archive.

    See Also:
        :func:`tzst.extract_archive`: The underlying function for extraction
        :func:`cmd_extract_full`: For extraction with directory structure
    """
    try:
        archive_path = Path(args.archive)
        if not archive_path.exists():
            return _emit_error(
                args,
                f"Error: Archive not found - {archive_path}",
                error_type="archive_not_found",
                details={"archive": str(archive_path)},
            )

        output_dir = Path(args.output) if args.output else Path.cwd()
        # An empty or absent member list means "extract everything".
        members = args.files if hasattr(args, "files") and args.files else None
        streaming = getattr(args, "streaming", False)
        filter_type = cast(
            Literal["data", "tar", "fully_trusted"], getattr(args, "filter", "data")
        )

        # Handle conflict resolution parameters
        conflict_resolution_str = getattr(args, "conflict_resolution", "ask")
        interactive_flag = getattr(args, "interactive", False)

        # If --interactive is specified, use "ask" regardless of --conflict-resolution
        if interactive_flag:
            conflict_resolution_str = "ask"

        # Convert string to ConflictResolution enum
        conflict_resolution = ConflictResolution(conflict_resolution_str)

        # Prompts would interleave with the JSON stream, so refuse up front.
        if _wants_json_output(args) and conflict_resolution == ConflictResolution.ASK:
            return _emit_error(
                args,
                "Error: JSON mode does not support interactive conflict prompts",
                error_type="interactive_conflict_not_supported",
            )

        # Set up interactive callback if needed
        interactive_callback = None
        if conflict_resolution == ConflictResolution.ASK:
            interactive_callback = _interactive_conflict_callback

        if not _wants_json_output(args):
            print(f"Extracting from: {archive_path}")
            print(f"Output directory: {output_dir}")
            if filter_type != "data":
                print(f"Using security filter: {filter_type}")
            if conflict_resolution != ConflictResolution.REPLACE:
                print(f"Conflict resolution: {conflict_resolution.value}")

        extract_archive(
            archive_path,
            output_dir,
            members,
            flatten=True,
            streaming=streaming,
            filter=filter_type,
            conflict_resolution=conflict_resolution,
            interactive_callback=interactive_callback,
        )

        if _wants_json_output(args):
            _emit_json(
                {
                    "ok": True,
                    "command": "extract-flat",
                    "archive": str(archive_path),
                    "output_dir": str(output_dir),
                    "members": members or [],
                    "flatten": True,
                    "streaming": streaming,
                    "filter": filter_type,
                    "conflict_resolution": conflict_resolution.value,
                }
            )
        else:
            print("Extraction completed successfully")
        return 0

    except FileNotFoundError as e:
        return _emit_error(
            args,
            f"Error: File not found - {e}",
            error_type="file_not_found",
        )
    except TzstDecompressionError as e:
        return _emit_error(
            args,
            f"Error: Archive decompression failed - {e}",
            error_type="decompression_failed",
        )
    except TzstArchiveError as e:
        return _emit_error(
            args,
            f"Error: Archive operation failed - {e}",
            error_type="archive_operation_failed",
        )
    except KeyboardInterrupt:
        # KeyboardInterrupt derives from BaseException, so the generic
        # handler below never sees it. Handle it explicitly so Ctrl+C gives
        # the documented exit code 130, as the other commands do.
        return _emit_error(
            args,
            "Operation interrupted by user",
            error_type="interrupted",
            exit_code=130,
        )
    except Exception as e:
        return _emit_error(
            args,
            f"Error: Failed to extract archive - {e}",
            error_type="extract_failed",
        )



def _print_verbose_listing(contents: list) -> None:
    """Print a detailed table of archive contents.

    One row per entry with permission bits, size, modification time and
    name, preceded by a header row and a separator line.

    Args:
        contents: Archive entries as dictionaries. ``name``, ``size`` and
            ``is_file`` are read directly; ``mode`` and ``mtime_str`` are
            optional.
    """
    print(f"{'Mode':<10} {'Size':<10} {'Modified':<20} {'Name'}")
    print("-" * 60)
    for item in contents:
        mode = item.get("mode")
        # Format the permission bits as four zero-padded octal digits.
        # Slicing oct(mode)[-4:] leaked the "o" of the "0o" prefix for
        # three-digit modes: oct(0o644) is "0o644", whose tail is "o644".
        mode_str = f"{mode & 0o7777:04o}" if mode else "----"
        size_str = format_size(item["size"]) if item["is_file"] else "<DIR>"
        # Limit the timestamp to 19 characters; missing/empty shows blank.
        mtime_str = (item.get("mtime_str") or "")[:19]
        print(f"{mode_str:<10} {size_str:<10} {mtime_str:<20} {item['name']}")


def _print_simple_listing(contents: list) -> None:
    """Print entry names one per line, followed by a totals line.

    A blank line separates the names from the totals, which come from
    ``_summarize_listing``.

    Args:
        contents: Archive entries as dictionaries with at least ``name``.
    """
    for entry in contents:
        print(entry["name"])

    print()
    totals = _summarize_listing(contents)
    file_part = f"Total: {totals['files']} files"
    dir_part = f"{totals['directories']} directories"
    size_part = f"{totals['total_size_human']}"
    print(", ".join((file_part, dir_part, size_part)))



[docs]
def cmd_list(args) -> int:
    """Command handler that lists the contents of an archive.

    Output is a JSON object in JSON mode, a detailed table when ``verbose``
    is set, and otherwise a plain list of names with a totals line.

    Args:
        args: Parsed command line arguments containing:
            - archive (str): Path to the archive file to list
            - verbose (bool, optional): Show detailed file information
            - streaming (bool, optional): Forwarded to ``list_archive``
            - json_output (bool, optional): Emit JSON instead of text

    Returns:
        int: Exit code
            - 0: Success
            - 1: Archive missing or any handled error
            - 130: Interrupted by the user (Ctrl+C)

    See Also:
        :func:`tzst.list_archive`: The underlying function for listing contents
    """
    try:
        source = Path(args.archive)
        if not source.exists():
            return _emit_error(
                args,
                f"Error: Archive not found - {source}",
                error_type="archive_not_found",
                details={"archive": str(source)},
            )

        detailed = getattr(args, "verbose", False)
        use_streaming = getattr(args, "streaming", False)
        json_mode = _wants_json_output(args)

        if not json_mode:
            print(f"Listing contents of: {source}")
            if use_streaming:
                print("Using streaming mode (memory efficient)")
            print()

        entries = list_archive(source, verbose=detailed, streaming=use_streaming)

        if json_mode:
            report = {
                "ok": True,
                "command": "list",
                "archive": str(source),
                "verbose": detailed,
                "streaming": use_streaming,
                "contents": entries,
                "summary": _summarize_listing(entries),
            }
            _emit_json(report)
        elif detailed:
            _print_verbose_listing(entries)
        else:
            _print_simple_listing(entries)

        return 0

    except FileNotFoundError as exc:
        return _emit_error(
            args,
            f"Error: File not found - {exc}",
            error_type="file_not_found",
        )
    except TzstDecompressionError as exc:
        return _emit_error(
            args,
            f"Error: Archive decompression failed - {exc}",
            error_type="decompression_failed",
        )
    except TzstArchiveError as exc:
        return _emit_error(
            args,
            f"Error: Archive operation failed - {exc}",
            error_type="archive_operation_failed",
        )
    except KeyboardInterrupt:
        return _emit_error(
            args,
            "Operation interrupted by user",
            error_type="interrupted",
            exit_code=130,
        )
    except Exception as exc:
        return _emit_error(
            args,
            f"Error: Failed to list archive - {exc}",
            error_type="list_failed",
        )




[docs]
def cmd_test(args) -> int:
    """Command handler that checks an archive's integrity.

    Delegates the check to ``test_archive`` and reports its boolean result.

    Args:
        args: Parsed command line arguments containing:
            - archive (str): Path to the archive file to test
            - streaming (bool, optional): Forwarded to ``test_archive``
            - json_output (bool, optional): Emit JSON instead of text

    Returns:
        int: Exit code
            - 0: ``test_archive`` reported the archive as healthy
            - 1: Check failed, archive missing, or any handled error
            - 130: Interrupted by the user (Ctrl+C)

    See Also:
        :func:`tzst.test_archive`: The underlying function for integrity testing
    """
    try:
        source = Path(args.archive)
        if not source.exists():
            return _emit_error(
                args,
                f"Error: Archive not found - {source}",
                error_type="archive_not_found",
                details={"archive": str(source)},
            )

        use_streaming = getattr(args, "streaming", False)
        json_mode = _wants_json_output(args)

        if not json_mode:
            print(f"Testing archive: {source}")
            if use_streaming:
                print("Using streaming mode (memory efficient)")

        # Failure first: a falsy result is reported as an error.
        if not test_archive(source, streaming=use_streaming):
            return _emit_error(
                args,
                "Archive test failed - errors detected",
                error_type="integrity_check_failed",
                details={
                    "command": "test",
                    "archive": str(source),
                    "streaming": use_streaming,
                    "healthy": False,
                },
            )

        if json_mode:
            _emit_json(
                {
                    "ok": True,
                    "command": "test",
                    "archive": str(source),
                    "streaming": use_streaming,
                    "healthy": True,
                }
            )
        else:
            print("Archive test passed - no errors detected")
        return 0

    except FileNotFoundError as exc:
        return _emit_error(
            args,
            f"Error: File not found - {exc}",
            error_type="file_not_found",
        )
    except TzstDecompressionError as exc:
        return _emit_error(
            args,
            f"Error: Archive decompression failed - {exc}",
            error_type="decompression_failed",
        )
    except TzstArchiveError as exc:
        return _emit_error(
            args,
            f"Error: Archive operation failed - {exc}",
            error_type="archive_operation_failed",
        )
    except KeyboardInterrupt:
        return _emit_error(
            args,
            "Operation interrupted by user",
            error_type="interrupted",
            exit_code=130,
        )
    except Exception as exc:
        return _emit_error(
            args,
            f"Error: Failed to test archive - {exc}",
            error_type="test_failed",
        )




[docs]
def cmd_version(args) -> int:
    """Report the tzst version in the format requested by the caller.

    When JSON output is requested, a JSON payload carrying the version is
    emitted. Otherwise a plain ``tzst <version>`` line is printed, but only
    if ``args.no_banner`` is truthy.

    Args:
        args: Parsed command-line namespace.

    Returns:
        int: Exit code (always 0)
    """
    if _wants_json_output(args):
        payload = {"ok": True, "command": "version", "version": __version__}
        _emit_json(payload)
        return 0

    # NOTE(review): presumably the startup banner already shows the version,
    # which is why nothing is printed unless the banner was suppressed - confirm.
    banner_suppressed = getattr(args, "no_banner", False)
    if banner_suppressed:
        print(f"tzst {__version__}")
    return 0




[docs]
def create_parser() -> argparse.ArgumentParser:
    """Build the ``tzst`` argument parser with every subcommand registered.

    The top-level parser carries the global ``--version``, ``--json`` and
    ``--no-banner`` flags. It uses ``RawDescriptionHelpFormatter`` so the
    hand-formatted epilog (command reference, argument summary, security
    note and documentation link) is shown verbatim in ``--help`` output.

    Subcommands registered, in this order:
        - a (aliases: add, create): create an archive
        - x (alias: extract): extract keeping directory structure
        - e (alias: extract-flat): extract without directory names
        - l (alias: list): list archive contents
        - t (alias: test): test archive integrity

    Each subcommand stores its handler under ``func`` via ``set_defaults``.

    Returns:
        argparse.ArgumentParser: Configured parser ready for argument parsing
    """
    reference_text = """
command reference:
  archive:
    a, add, create    tzst a archive.tzst files...  [-l LEVEL] [--no-atomic]

  extract:
    x, extract        tzst x archive.tzst [files...] [-o DIR] [--streaming] [--filter FILTER]
    e, extract-flat   tzst e archive.tzst [files...] [-o DIR] [--streaming] [--filter FILTER]

  manage:
    l, list           tzst l archive.tzst [-v] [--streaming]
    t, test           tzst t archive.tzst [--streaming]

arguments:
  -l, --level LEVEL   compression level (1-22, default: 3)
  -o, --output DIR    output directory (default: current directory)
  -v, --verbose       show detailed information
  --streaming         use streaming mode for memory efficiency with large archives
  --filter FILTER     security filter for extraction: data (safest, default), tar, fully_trusted
  --no-atomic         disable atomic file operations (not recommended)

security note:
  always use --filter=data (default) when extracting archives from untrusted sources
  never use --filter=fully_trusted unless you completely trust the archive source

documentation:
  https://tzst.xi-xu.me
"""

    def add_archive_argument(target: argparse.ArgumentParser) -> None:
        # Every subcommand takes the archive path as its first positional.
        target.add_argument("archive", help="archive file path")

    def add_streaming_flag(target: argparse.ArgumentParser) -> None:
        # Shared by the extract, list and test subcommands.
        target.add_argument(
            "--streaming",
            action="store_true",
            help="use streaming mode for memory efficiency with large archives",
        )

    def add_extraction_options(target: argparse.ArgumentParser) -> None:
        # Both extraction subcommands expose the same arguments; the order of
        # registration is kept so the generated help text is unchanged.
        add_archive_argument(target)
        target.add_argument("files", nargs="*", help="specific files to extract")
        target.add_argument(
            "-o", "--output", help="output directory (default: current directory)"
        )
        add_streaming_flag(target)
        target.add_argument(
            "--filter",
            choices=["data", "tar", "fully_trusted"],
            default="data",
            help=(
                "Extraction filter for security (default: data). 'data' is safest "
                "for untrusted archives, 'tar' honors most tar features, "
                "'fully_trusted' honors all metadata"
            ),
        )
        target.add_argument(
            "--conflict-resolution",
            choices=[
                "replace",
                "skip",
                "replace_all",
                "skip_all",
                "auto_rename",
                "auto_rename_all",
                "ask",
            ],
            default="ask",
            help=(
                "How to handle file conflicts during extraction (default: ask). "
                "'ask' prompts for each conflict, 'replace' overwrites existing files, "
                "'skip' skips existing files, 'auto_rename' creates new names. "
                "Adding '_all' applies the action to all subsequent conflicts."
            ),
        )

    # Top-level parser and its global flags
    root = argparse.ArgumentParser(
        prog="tzst",
        epilog=reference_text,
        formatter_class=argparse.RawDescriptionHelpFormatter,
        add_help=True,
    )
    root.add_argument(
        "--version", action="store_true", help="show version information and exit"
    )
    root.add_argument(
        "--json",
        dest="json_output",
        action="store_true",
        help="emit machine-readable JSON output",
    )
    root.add_argument(
        "--no-banner",
        action="store_true",
        help="suppress the startup banner",
    )

    commands = root.add_subparsers(
        dest="command", title="commands", metavar="COMMAND"
    )

    # a / add / create
    create_cmd = commands.add_parser(
        "a", aliases=["add", "create"], help="add files to archive"
    )
    add_archive_argument(create_cmd)
    create_cmd.add_argument("files", nargs="+", help="files/directories to add")
    create_cmd.add_argument(
        "-c",
        "-l",
        "--level",
        dest="compression_level",
        type=validate_compression_level,
        default=3,
        metavar="LEVEL",
        help="compression level (1-22, default: 3)",
    )
    create_cmd.add_argument(
        "--no-atomic",
        action="store_true",
        help=(
            "Disable atomic file operations (not recommended - creates archive "
            "directly without temporary file)"
        ),
    )
    create_cmd.set_defaults(func=cmd_add)

    # x / extract
    extract_cmd = commands.add_parser(
        "x", aliases=["extract"], help="eXtract files with full paths"
    )
    add_extraction_options(extract_cmd)
    extract_cmd.set_defaults(func=cmd_extract_full)

    # e / extract-flat
    flat_cmd = commands.add_parser(
        "e",
        aliases=["extract-flat"],
        help="extract files from archive (without using directory names)",
    )
    add_extraction_options(flat_cmd)
    flat_cmd.set_defaults(func=cmd_extract_flat)

    # l / list
    list_cmd = commands.add_parser(
        "l", aliases=["list"], help="list contents of archive"
    )
    add_archive_argument(list_cmd)
    list_cmd.add_argument(
        "-v", "--verbose", action="store_true", help="show detailed information"
    )
    add_streaming_flag(list_cmd)
    list_cmd.set_defaults(func=cmd_list)

    # t / test
    test_cmd = commands.add_parser(
        "t", aliases=["test"], help="test integrity of archive"
    )
    add_archive_argument(test_cmd)
    add_streaming_flag(test_cmd)
    test_cmd.set_defaults(func=cmd_test)

    return root



def _validate_compression_level_in_argv(argv: list[str]) -> bool:
    """Check for compression level validation errors in argv.

    Args:
        argv: Command line arguments

    Returns:
        bool: True if an error was found and handled, False otherwise
    """
    if "-c" not in argv and "-l" not in argv and "--level" not in argv:
        return False

    try:
        level_index = -1
        if "-c" in argv:
            level_index = argv.index("-c")
        elif "-l" in argv:
            level_index = argv.index("-l")
        else:
            level_index = argv.index("--level")
        if level_index + 1 < len(argv):
            level_value = argv[level_index + 1]
            try:
                level = int(level_value)
                if not 1 <= level <= 22:
                    print(
                        f"Invalid compression level: {level}. "
                        f"Must be between 1 and 22.",
                        file=sys.stderr,
                    )
                    return True
            except ValueError:
                print(
                    f"Invalid compression level: '{level_value}'. "
                    f"Must be an integer between 1 and 22.",
                    file=sys.stderr,
                )
                return True
    except (ValueError, IndexError):
        pass
    return False


def _validate_filter_in_argv(argv: list[str]) -> bool:
    """Check for filter validation errors in argv.

    Args:
        argv: Command line arguments

    Returns:
        bool: True if an error was found and handled, False otherwise
    """
    if "--filter" not in argv:
        return False

    try:
        filter_index = argv.index("--filter")
        if filter_index + 1 < len(argv):
            filter_value = argv[filter_index + 1]
            valid_filters = ["data", "tar", "fully_trusted"]
            if filter_value not in valid_filters:
                print(
                    f"Invalid filter specified: {filter_value}. "
                    f"Must be one of: {', '.join(valid_filters)}",
                    file=sys.stderr,
                )
                return True
    except (ValueError, IndexError):
        pass
    return False


def _validate_command_in_argv(argv: list[str]) -> bool:
    """Check for invalid command errors in argv.

    Args:
        argv: Command line arguments

    Returns:
        bool: True if an invalid command was found and handled, False otherwise
    """
    if not argv:
        return False

    # Valid commands and their aliases
    valid_commands = {
        "a",
        "add",
        "create",
        "x",
        "extract",
        "e",
        "extract-flat",
        "l",
        "list",
        "t",
        "test",
    }

    # Find the first argument that's not a flag (doesn't start with -)
    for arg in argv:
        if not arg.startswith("-"):
            if arg not in valid_commands:
                print(
                    f"Invalid command: '{arg}'. "
                    f"Valid commands are: {', '.join(sorted(valid_commands))}",
                    file=sys.stderr,
                )
                return True
            break

    return False


def _is_extreme_compression_level_in_argv(argv: list[str]) -> bool:
    """Check for extreme compression level values that warrant special handling.

    Args:
        argv: Command line arguments

    Returns:
        bool: True if an extreme compression level value is found, False otherwise
    """
    if "-c" not in argv and "-l" not in argv and "--level" not in argv:
        return False

    try:
        level_index = -1
        if "-c" in argv:
            level_index = argv.index("-c")
        elif "-l" in argv:
            level_index = argv.index("-l")
        else:
            level_index = argv.index("--level")
        if level_index + 1 < len(argv):
            level_value = argv[level_index + 1]
            try:
                level = int(level_value)
                # Only consider extreme values (>=1000) for special handling
                return level >= 1000
            except ValueError:
                pass
    except (ValueError, IndexError):
        pass
    return False


def _handle_parsing_errors(e: SystemExit, argv: list[str] | None) -> int:
    """Handle SystemExit exceptions from argument parsing.

    Args:
        e: SystemExit exception from argparse
        argv: Command line arguments, if any

    Returns:
        int: Appropriate exit code
    """  # Help was requested
    if e.code == 0:
        return 0
    elif e.code == 2 and argv:
        # For now, keep standard argparse behavior (exit code 2)
        # Future versions may convert specific validation errors to exit code 1
        pass

    # Return the original exit code for other cases
    return int(e.code) if e.code is not None else 1


def _parse_arguments(parser, argv: list[str] | None):
    """Parse command line arguments with error handling.

    Args:
        parser: The argument parser
        argv: Command line arguments

    Returns:
        tuple: (args, error_code) where error_code is None for success
    """
    try:
        args = parser.parse_args(argv)
        return args, None
    except SystemExit as e:
        return None, _handle_parsing_errors(e, argv)


def _execute_command(args, parser) -> int:
    """Execute the parsed command.

    Args:
        args: Parsed command line arguments
        parser: The argument parser for help display

    Returns:
        int: Exit code from command execution
    """
    # Handle --version flag
    if hasattr(args, "version") and args.version:
        return cmd_version(args)

    if not hasattr(args, "func"):
        parser.print_help()
        return 1

    return args.func(args)



[docs]
def main(argv: list[str] | None = None) -> int:
    """Main entry point for the tzst command-line interface.

    Prints the banner when ``_should_print_banner`` allows it, builds the
    parser, parses ``argv`` and then either reports the parsing failure or
    runs the selected command.

    Args:
        argv (list[str] | None, optional): Command line arguments to parse.
            Passed straight to the parser; ``None`` lets argparse fall back
            to ``sys.argv``. Defaults to None.

    Returns:
        int: Exit code for the program. If argument parsing stopped early
        (a help request or a usage error), the code produced by
        ``_parse_arguments``; otherwise the code returned by
        ``_execute_command``.

    See Also:
        :func:`create_parser`: Creates the argument parser used by this function
    """
    if _should_print_banner(argv):
        print_banner()

    cli_parser = create_parser()
    parsed_args, parse_failure = _parse_arguments(cli_parser, argv)

    # A non-None failure code means parsing ended before a command was chosen.
    if parse_failure is None:
        return _execute_command(parsed_args, cli_parser)
    return parse_failure



# Script entry point: hand main()'s return value to the interpreter as the
# process exit status.
if __name__ == "__main__":
    raise SystemExit(main())