Added parallel processing, setup cli, and refactored project structure. - ratchets - Unnamed repository; edit this file 'description' to name the repository.

commit 844a0da541b0b20102e1e865159180e09331336b
parent 895b4fc9a75458ddbd1c9a37d2fe0d6434d23afa
Author: Andrew Laack <andrew@laack.co>
Date:   Wed, 18 Jun 2025 10:43:45 -0500

Added parallel processing, setup cli, and refactored project structure.

Diffstat:
M .gitignore  | 3 ++-
A src/ratchets/__init__.py  | 0 
A src/ratchets/__main__.py  | 3 +++
A src/ratchets/abstracted_tests.py  | 116 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
A src/ratchets/run_tests.py  | 436 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
A src/ratchets/test_ratchet.py  | 34 ++++++++++++++++++++++++++++++++++
A src/ratchets/validate.py  | 55 +++++++++++++++++++++++++++++++++++++++++++++++++++++++
D src/run_tests.py  | 445 -------------------------------------------------------------------------------
D src/test_ratchet.py  | 101 -------------------------------------------------------------------------------
D src/validate.py  | 56 --------------------------------------------------------

10 files changed, 646 insertions(+), 603 deletions(-)
diff --git a/.gitignore b/.gitignore
@@ -195,4 +195,5 @@ cython_debug/
 ratchet_values.json
 ratchet_excluded.txt
 *.toml
-tests/
+notes/
+data/
diff --git a/src/ratchets/__init__.py b/src/ratchets/__init__.py
diff --git a/src/ratchets/__main__.py b/src/ratchets/__main__.py
@@ -0,0 +1,3 @@
+from .run_tests import cli
+if __name__ == "__main__":
+    cli()
diff --git a/src/ratchets/abstracted_tests.py b/src/ratchets/abstracted_tests.py
@@ -0,0 +1,116 @@
+import os
+import json
+import toml
+from pathlib import Path
+from typing import Dict, Any, List
+
+from .run_tests import (
+    evaluate_python_tests,
+    evaluate_command_tests,
+    filter_excluded_files,
+    find_project_root,
+    get_python_files,
+    get_ratchet_path,
+)
+
+
+def get_root() -> str:
+    """Return the project root directory."""
+    return find_project_root()
+
+
+def get_config() -> Dict[str, Any]:
+    """Load and return the tests.toml configuration as a dict."""
+    root = get_root()
+    toml_path = Path(root) / "tests.toml"
+    try:
+        return toml.load(toml_path)
+    except Exception:
+        return {}
+
+
+def get_python_tests() -> Dict[str, Any]:
+    """Extract and return the 'python-tests' section from config."""
+    config = get_config()
+    return config.get("python-tests", {}) or {}
+
+
+def get_command_tests() -> Dict[str, Any]:
+    """Extract and return the 'custom-tests' section from config."""
+    config = get_config()
+    return config.get("custom-tests", {}) or {}
+
+
+def load_baseline_counts() -> Dict[str, int]:
+    """Load baseline counts from ratchet path, returning a dict of test_name to count."""
+    try:
+        ratchet_path: str = get_ratchet_path()
+        if os.path.isfile(ratchet_path):
+            with open(ratchet_path, 'r', encoding='utf-8') as f:
+                data = json.load(f)
+                if isinstance(data, dict):
+                    return {k: int(v) for k, v in data.items()}
+    except Exception:
+        pass
+    return {}
+
+
+def get_baseline_counts() -> Dict[str, int]:
+    """Return baseline counts, caching on first call."""
+    return load_baseline_counts()
+
+
+def get_filtered_files() -> List[Path]:
+    """Retrieve all Python files under the project, filtering excluded paths."""
+    root = get_root()
+    files: List[Path] = get_python_files(root)
+    excluded_path: str = os.path.join(root, "ratchet_excluded.txt")
+    ignore_path: str = os.path.join(root, ".gitignore")
+    try:
+        return filter_excluded_files(files, excluded_path, ignore_path)
+    except Exception:
+        return files
+
+
+def get_python_test_matches(test_name: str, rule: Dict[str, Any]) -> List[Dict[str, Any]]:
+    """Run the Python regex test for a single rule and return matches."""
+    files = get_filtered_files()
+    results: Dict[str, List[Dict[str, Any]]] = evaluate_python_tests(files, {test_name: rule})
+    return results.get(test_name, [])
+
+
+def get_command_test_matches(test_name: str, test_dict: Dict[str, Any]) -> List[Dict[str, Any]]:
+    """Run the custom command test for a single rule and return matches."""
+    files = get_filtered_files()
+    results: Dict[str, List[Dict[str, Any]]] = evaluate_command_tests(files, {test_name: test_dict})
+    return results.get(test_name, [])
+
+
+def check_python_rule(test_name: str, rule: Dict[str, Any]) -> None:
+    """Assert that current regex violations do not exceed baseline."""
+    matches = get_python_test_matches(test_name, rule)
+    current_count = len(matches)
+    baseline_counts = get_baseline_counts()
+    baseline_count = baseline_counts.get(test_name, 0)
+    if current_count > baseline_count:
+        details = "\n".join(
+            f"{r.get('file')}:{r.get('line')} — {r.get('content')}" for r in matches
+        )
+        raise AssertionError(
+            f"Regex violations for '{test_name}' increased: baseline={baseline_count}, current={current_count}\n" + details
+        )
+
+
+def check_command_rule(test_name: str, test_dict: Dict[str, Any]) -> None:
+    """Assert that current command violations do not exceed baseline."""
+    matches = get_command_test_matches(test_name, test_dict)
+    current_count = len(matches)
+    baseline_counts = get_baseline_counts()
+    baseline_count = baseline_counts.get(test_name, 0)
+    if current_count > baseline_count:
+        details = "\n".join(
+            f"{r.get('file')} — {r.get('content')}" for r in matches
+        )
+        raise AssertionError(
+            f"Command violations for '{test_name}' increased: baseline={baseline_count}, current={current_count}\n" + details
+        )
diff --git a/src/ratchets/run_tests.py b/src/ratchets/run_tests.py
@@ -0,0 +1,436 @@
+import os
+import threading
+import pathspec
+from datetime import datetime
+from pathlib import Path
+import toml
+import argparse
+import json
+import re
+import subprocess
+from typing import Optional, List, Dict, Tuple, Union, Any
+
+
+def print_diff(current_json: Dict[str, int], previous_json: Dict[str, int]) -> None:
+    all_keys = set(current_json.keys()) | set(previous_json.keys())
+    diff_count = 0
+    for key in sorted(all_keys):
+        current_value = current_json.get(key, 0)
+        previous_value = previous_json.get(key, 0)
+        if current_value != previous_value:
+            diff_count += 1
+            diff = current_value - previous_value
+            sign = "+" if diff > 0 else "-"
+            print(f"  {key}: {previous_value} → {current_value} ({sign}{abs(diff)})")
+    if diff_count == 0:
+        print("There are no differences.")
+
+
+def find_project_root(start_path: Optional[str] = None, markers: Optional[List[str]] = None) -> str:
+    if start_path is None:
+        start_path = os.getcwd()
+    if markers is None:
+        markers = ['.git', 'pyproject.toml', 'setup.py', 'tests.toml']
+    current = os.path.abspath(start_path)
+    while True:
+        for marker in markers:
+            if os.path.exists(os.path.join(current, marker)):
+                return current
+        parent = os.path.dirname(current)
+        if parent == current:
+            raise FileNotFoundError("Project root not found.")
+        current = parent
+
+
+def get_excludes_path() -> str:
+    DEFAULT_FILENAME = "ratchet_excluded.txt"
+    root = find_project_root(None)
+    return os.path.join(root, DEFAULT_FILENAME)
+
+
+def get_file_path(file: Optional[str]) -> str:
+    DEFAULT_FILENAME = "tests.toml"
+    if not file:
+        file = DEFAULT_FILENAME
+    if "/" in file:
+        return file
+    else:
+        root = find_project_root(file)
+        return os.path.join(root, file)
+
+
+def get_python_files(directory: Union[str, Path]) -> List[Path]:
+    directory = Path(directory)
+    python_files = set([path.absolute() for path in directory.rglob("*.py") if not path.is_symlink()])
+    return list(python_files)
+
+
+def filter_excluded_files(files: List[Path], excluded_path: str, ignore_path: str) -> List[Path]:
+    with open(excluded_path, 'r') as f:
+        patterns = f.read().splitlines()
+    if os.path.isfile(ignore_path):
+        with open(ignore_path, 'r') as f:
+            patterns += f.read().splitlines()
+    spec = pathspec.PathSpec.from_lines('gitwildmatch', patterns)
+    files = [f for f in files if not spec.match_file(f)]
+    return files
+
+
+def evaluate_tests(path: str, cmd_only: bool, regex_only: bool) -> Tuple[Dict[str, List[Dict[str, Any]]], Dict[str, List[Dict[str, Any]]]]:
+    assert os.path.isfile(path)
+    config = toml.load(path)
+    python_tests = config.get("python-tests")
+    custom_tests = config.get("custom-tests")
+    root = find_project_root()
+    files = get_python_files(root)
+    EXCLUDED_PATH = "ratchet_excluded.txt"
+    excluded_path = os.path.join(root, EXCLUDED_PATH)
+    ignore_path = os.path.join(root, ".gitignore")
+    files = filter_excluded_files(files, excluded_path, ignore_path)
+    test_issues: Dict[str, List[Dict[str, Any]]] = {}
+    custom_issues: Dict[str, List[Dict[str, Any]]] = {}
+    if python_tests and not cmd_only:
+        test_issues = evaluate_python_tests(files, python_tests)  # type: ignore
+    if custom_tests and not regex_only:
+        custom_issues = evaluate_command_tests(files, custom_tests)  # type: ignore
+    return test_issues, custom_issues
+
+
+def print_issues(issues: Dict[str, List[Dict[str, Any]]]) -> None:
+    for test_name, matches in issues.items():
+        if matches:
+            print(f"\n{test_name} — matched {len(matches)} issue(s):")
+            for match in matches:
+                file_path = match['file']
+                line = match.get('line')
+                content = match['content']
+                truncated = content if len(content) <= 80 else content[:80] + "..."
+                if line is not None:
+                    print(f"  → {file_path}:{line}: {truncated}")
+                else:
+                    print(f"  → {file_path}: {truncated}")
+        else:
+            print(f"\n{test_name} — no issues found.")
+
+
+def load_ratchet_results() -> Dict[str, Any]:
+    path = get_ratchet_path()
+    with open(path, 'r') as file:
+        data = json.load(file)
+    return data
+
+
+def evaluate_python_tests(files: List[Path], test_str: Dict[str, Dict[str, Any]]) -> Dict[str, List[Dict[str, Any]]]:
+    assert len(files) != 0
+    assert len(test_str) != 0
+
+    results: Dict[str, List[Dict[str, Any]]] = {}
+    threads = []
+    results_lock = threading.Lock()
+
+    def eval_thread(test_name: str, rule: Dict[str, Any]):
+        pattern = re.compile(rule["regex"])
+        matches = []
+
+        for file_path in files:
+            with open(file_path, 'r', encoding='utf-8') as f:
+                for lineno, line in enumerate(f, 1):
+                    if pattern.search(line):
+                        matches.append({
+                            "file": str(file_path),
+                            "line": lineno,
+                            "content": line.strip()
+                        })
+        with results_lock:
+            results[test_name] = matches
+
+    for test_name, rule in test_str.items():
+        thread = threading.Thread(target=eval_thread, args=(test_name, rule))
+        thread.start()
+        threads.append(thread)
+
+    for thread in threads:
+        thread.join()
+
+    return results
+
+
+def get_ratchet_path() -> str:
+    root = find_project_root()
+    RATCHET_NAME = "ratchet_values.json"
+    ratchet_file_path = os.path.join(root, RATCHET_NAME)
+    return ratchet_file_path
+
+
+def evaluate_command_tests(files: List[Path], test_str: Dict[str, Dict[str, Any]]) -> Dict[str, List[Dict[str, Any]]]:
+    assert len(test_str) != 0
+    assert len(files) != 0
+
+    results: Dict[str, List[Dict[str, Any]]] = {test_name: [] for test_name in test_str}
+    lock = threading.Lock()
+
+    def worker(test_name: str, command_template: str, file_path: str):
+        cmd_str = f"echo {file_path} | {command_template}"
+        try:
+            result = subprocess.run(
+                cmd_str,
+                shell=True,
+                text=True,
+                capture_output=True,
+                timeout=5
+            )
+            output = result.stdout.strip()
+            if output:
+                lines = output.splitlines()
+                with lock:
+                    for line in lines:
+                        results[test_name].append({
+                            "file": file_path,
+                            "line": None,
+                            "content": line.strip()
+                        })
+        except subprocess.TimeoutExpired:
+            print(f"Timeout while running test '{test_name}' on {file_path}")
+
+    threads = []
+
+    for test_name, test_dict in test_str.items():
+        command_template = test_dict["command"]
+        for file_path in files:
+            t = threading.Thread(target=worker, args=(test_name, command_template, file_path))
+            t.start()
+            threads.append(t)
+
+    for t in threads:
+        t.join()
+
+    return results
+
+
+def results_to_json(results: Tuple[Dict[str, List[Dict[str, Any]]], Dict[str, List[Dict[str, Any]]]]) -> str:
+    test_issues, custom_issues = results
+    counts: Dict[str, int] = {}
+    for name, matches in test_issues.items():
+        counts[name] = len(matches)
+    for name, matches in custom_issues.items():
+        counts[name] = counts.get(name, 0) + len(matches)
+    return json.dumps(counts, indent=2, sort_keys=True)
+
+
+def update_ratchets(test_path: str, cmd_mode: bool, regex_mode: bool) -> None:
+    results = evaluate_tests(test_path, cmd_mode, regex_mode)
+    results_json = results_to_json(results)
+    path = get_ratchet_path()
+    with open(path, 'w') as file:
+        file.writelines(results_json)
+
+
+def print_issues_with_blames(results: Tuple[Dict[str, List[Dict[str, Any]]], Dict[str, List[Dict[str, Any]]]], max_count: int) -> None:
+    enriched_test_issues, enriched_custom_issues = add_blames(results)
+
+    def _parse_time(ts: Optional[str]) -> datetime:
+        if not ts:
+            return datetime.max
+        try:
+            return datetime.fromisoformat(ts)
+        except Exception:
+            return datetime.max
+
+    def _print_section(section_name: str, issues_dict: Dict[str, List[Dict[str, Any]]]) -> None:
+        for test_name, matches in issues_dict.items():
+            if matches:
+                sorted_matches = sorted(matches, key=lambda m: _parse_time(m.get("blame_time")))  # type: ignore
+                print("\n" + "-" * 40)
+                print(f"{section_name} — {test_name} ({len(sorted_matches)} issue{'s' if len(sorted_matches) != 1 else ''}):")
+                print("-" * 40)
+                count = 0
+                for match in sorted_matches:
+                    count += 1
+                    if count > max_count:
+                        break
+                    file_path = match.get("file", "<unknown>")
+                    line_no = match.get("line")
+                    content = match.get("content", "").strip()
+                    truncated = content if len(content) <= 80 else content[:80] + "..."
+                    author = match.get("blame_author") or "Unknown"
+                    ts = match.get("blame_time") or "Unknown"
+                    if line_no is not None:
+                        print(f"  → {file_path}:{line_no}  by {author} at {ts}")
+                        print(f"       {truncated}")
+                    else:
+                        print(f"  → {file_path}  by {author} at {ts}")
+                        print(f"       {truncated}")
+            else:
+                print(f"\n{section_name} — {test_name}: no issues found.")
+
+    _print_section("Regex Test", enriched_test_issues)
+    _print_section("Command Test", enriched_custom_issues)
+
+
+def add_blames(results: Tuple[Dict[str, List[Dict[str, Any]]], Dict[str, List[Dict[str, Any]]]]) -> Tuple[Dict[str, List[Dict[str, Any]]], Dict[str, List[Dict[str, Any]]]]:
+    test_issues, custom_issues = results
+    try:
+        repo_root: Optional[str] = find_project_root()
+    except Exception:
+        repo_root = None
+
+    def get_blame_for_line(file_path: str, line_no: Optional[int]) -> Tuple[Optional[str], Optional[str]]:
+        if repo_root is None:
+            return None, None
+        cmd = ["git", "blame", "-L", f"{line_no},{line_no}", "--porcelain", file_path]
+        try:
+            res = subprocess.run(cmd, capture_output=True, text=True, cwd=repo_root, timeout=5)
+            if res.returncode != 0:
+                return None, None
+            author: Optional[str] = None
+            author_time: Optional[str] = None
+            for l in res.stdout.splitlines():
+                if l.startswith("author "):
+                    author = l[len("author "):].strip()
+                elif l.startswith("author-time "):
+                    try:
+                        ts = int(l[len("author-time "):].strip())
+                        author_time = datetime.fromtimestamp(ts).isoformat()
+                    except Exception:
+                        author_time = None
+                if author is not None and author_time is not None:
+                    break
+            return author, author_time
+        except Exception:
+            return None, None
+
+    def get_last_commit_for_file(file_path: str) -> Tuple[Optional[str], Optional[str]]:
+        if repo_root is None:
+            return None, None
+        cmd = ["git", "log", "-1", "--format=%an;%at", "--", file_path]
+        try:
+            res = subprocess.run(cmd, capture_output=True, text=True, cwd=repo_root, timeout=5)
+            if res.returncode != 0 or not res.stdout.strip():
+                return None, None
+            out = res.stdout.strip()
+            parts = out.split(";", 1)
+            if len(parts) != 2:
+                return None, None
+            author = parts[0].strip()
+            try:
+                ts = int(parts[1].strip())
+                author_time = datetime.fromtimestamp(ts).isoformat()
+            except Exception:
+                author_time = None
+            return author, author_time
+        except Exception:
+            return None, None
+
+    for issues in (test_issues, custom_issues):
+        for test_name, matches in issues.items():
+            for match in matches:
+                file_path = match.get("file")
+                line_no = match.get("line")
+                if not file_path:
+                    continue
+                if line_no is not None:
+                    author, author_time = get_blame_for_line(file_path, line_no)
+                else:
+                    author, author_time = get_last_commit_for_file(file_path)
+                match["blame_author"] = author if author is not None else None
+                match["blame_time"] = author_time if author_time is not None else None
+
+    return test_issues, custom_issues
+
+
+
+
+def cli():
+    parser = argparse.ArgumentParser(description="Python ratchet testing")
+
+    # Input file
+    parser.add_argument("-f", "--file", help="specify .toml file with tests")
+
+    # Filtering modes
+    parser.add_argument(
+        "-c", "--command-only",
+        action="store_true",
+        help="run only custom command-based tests"
+    )
+    parser.add_argument(
+        "-r", "--regex-only",
+        action="store_true",
+        help="run only regex-based tests"
+    )
+
+    # Output formatting
+    parser.add_argument(
+        "-v", "--verbose",
+        action="store_true",
+        help="run verbose tests, printing each infringing line"
+    )
+
+    # Blame and related
+    parser.add_argument(
+        "-b", "--blame",
+        action="store_true",
+        help="run an additional git-blame for each infraction, ordering results by timestamp"
+    )
+    parser.add_argument(
+        "-m", "--max-count",
+        type=int,
+        help="maximum infractions to display per test (only applies with --blame; default is 10)"
+    )
+
+    # Modes of operation
+    parser.add_argument(
+        "--compare-counts",
+        action="store_true",
+        help="show only the differences in infraction counts between the current and last saved tests"
+    )
+    parser.add_argument(
+        "-u", "--update-ratchets",
+        action="store_true",
+        help="update ratchets_values.json"
+    )
+    
+    args = parser.parse_args()
+    file: Optional[str] = args.file
+    cmd_mode: bool = args.command_only
+    regex_mode: bool = args.regex_only
+    update: bool = args.update_ratchets
+    compare_counts: bool = args.compare_counts
+    blame: bool = args.blame
+    verbose: bool = args.verbose
+    max_count: Optional[int] = args.max_count
+
+    if not max_count:
+        max_count = 10
+    test_path = get_file_path(file)
+
+    # Probably should enforce only
+    # one can be selected via an error on
+    # the CLI instead of functionally 
+    # defining a hierarchy.
+
+    if blame:
+        issues = evaluate_tests(test_path, cmd_mode, regex_mode)
+        with_blames = add_blames(issues)
+        print_issues_with_blames(issues, max_count)
+    elif compare_counts:
+        issues = evaluate_tests(test_path, cmd_mode, regex_mode)
+        current_json = json.loads(results_to_json(issues))
+        previous_json = load_ratchet_results()
+        print_diff(current_json, previous_json)
+    elif update:
+        update_ratchets(test_path, cmd_mode, regex_mode)
+    elif verbose:
+        issues = evaluate_tests(test_path, cmd_mode, regex_mode)
+        for issue_type in issues:
+            print_issues(issue_type)
+    else:
+        issues = evaluate_tests(test_path, cmd_mode, regex_mode)
+        current_json = json.loads(results_to_json(issues))
+        print("Current " + str(current_json))
+        previous_json = load_ratchet_results()
+        print("Previous: " + str(previous_json))
+        print("Diffs:")
+        print_diff(current_json, previous_json)
+
+if __name__ == "__main__":
+    cli()
diff --git a/src/ratchets/test_ratchet.py b/src/ratchets/test_ratchet.py
@@ -0,0 +1,34 @@
+import pytest
+from abstracted_tests import get_python_tests, get_command_tests, check_python_rule, check_command_rule
+
+@pytest.mark.parametrize("test_name,rule", get_python_tests().items())
+def test_python_regex_rule(test_name: str, rule: dict) -> None:
+    check_python_rule(test_name, rule)
+
+@pytest.mark.parametrize("test_name,test_dict", get_command_tests().items())
+def test_custom_command_rule(test_name: str, test_dict: dict) -> None:
+    check_command_rule(test_name, test_dict)
+
+    # def test_all_python_regex_rules():
+    #     errors = []
+    #     for test_name, rule in get_python_tests().items():
+    #         try:
+    #             check_python_rule(test_name, rule)
+    #         except AssertionError as e:
+    #             errors.append(f"{test_name}: {e}")
+    #         except Exception as e:
+    #             errors.append(f"{test_name}: unexpected error: {e!r}")
+    #     if errors:
+    #         pytest.fail("Some python regex rules failed:\n" + "\n".join(errors))
+    # 
+    # def test_all_command_rules():
+    #     errors = []
+    #     for test_name, test_dict in get_command_tests().items():
+    #         try:
+    #             check_command_rule(test_name, test_dict)
+    #         except AssertionError as e:
+    #             errors.append(f"{test_name}: {e}")
+    #         except Exception as e:
+    #             errors.append(f"{test_name}: unexpected error: {e!r}")
+    #     if errors:
+    #         pytest.fail("Some command rules failed:\n" + "\n".join(errors))
diff --git a/src/ratchets/validate.py b/src/ratchets/validate.py
@@ -0,0 +1,55 @@
+import run_tests
+import re
+import toml
+import argparse
+from typing import Dict, Any, Optional
+
+def evaluate_single_regex(regex: str, custom_str: str) -> Optional[re.Match[str]]:
+    pattern = re.compile(regex)
+    return pattern.search(custom_str)
+
+def check_valid(python_tests: Dict[str, Dict[str, Any]]) -> None:
+    for test in python_tests:
+        regex: str = python_tests[test]["regex"]
+        for validation in python_tests[test]["valid"]:
+            for line in validation.splitlines():
+                if evaluate_single_regex(regex, line):
+                    raise AssertionError(f"Regex: {regex} matched {line}")
+
+def check_invalid(python_tests: Dict[str, Dict[str, Any]]) -> int:
+    for test in python_tests:
+        regex: str = python_tests[test]["regex"]
+        for validation in python_tests[test]["invalid"]:
+            found: bool = False
+            for line in validation.splitlines():
+                if evaluate_single_regex(regex, line):
+                    found = True
+            if not found:
+                raise AssertionError(f"Regex: {regex} not matched in {validation}")
+    return 0
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Python ratchet testing")
+    parser.add_argument("-f", "--file")
+    args = parser.parse_args()
+    file: Optional[str] = args.file
+    test_path: str = run_tests.get_file_path(file)
+    config: Dict[str, Any] = toml.load(test_path)
+    python_tests: Optional[Dict[str, Dict[str, Any]]] = config.get("python-tests")
+
+    if python_tests is None:
+        print("No python tests found, there is nothing to validate.")
+        exit()
+
+    check_valid(python_tests)
+    check_invalid(python_tests)
+
+    print(f"All expected regex invalid/valid samples are correct for:\n{test_path}")
+
+
+
+
+
+
+
+
diff --git a/src/run_tests.py b/src/run_tests.py
@@ -1,445 +0,0 @@
-import os
-import pathspec
-from datetime import datetime
-from pathlib import Path
-import toml
-import argparse
-import json
-import re
-import subprocess
-
-def print_diff(current_json, previous_json):
-    all_keys = set(current_json.keys()) | set(previous_json.keys())
-
-    diff_count = 0
-
-    for key in sorted(all_keys):
-        current_value = current_json.get(key, 0)
-        previous_value = previous_json.get(key, 0)
-
-        if current_value != previous_value:
-            diff_count += 1
-            diff = current_value - previous_value
-            sign = "+" if diff > 0 else "-"
-            print(f"  {key}: {previous_value} → {current_value} ({sign}{abs(diff)})")
-    
-    if diff_count == 0:
-        print("There are no differences.")
-
-def find_project_root(start_path=None, markers=None):
-    if start_path is None:
-        start_path = os.getcwd()
-    if markers is None:
-        markers = ['.git', 'pyproject.toml', 'setup.py', 'tests.toml']
-
-    current = os.path.abspath(start_path)
-    while True:
-        for marker in markers:
-            if os.path.exists(os.path.join(current, marker)):
-                return current
-        parent = os.path.dirname(current)
-        if parent == current:
-            raise FileNotFoundError("Project root not found.")
-        current = parent
-
-
-def get_excludes_path():
-    DEFAULT_FILENAME = "ratchet_excluded.txt"
-    root = find_project_root(file)
-    return os.path.join(root, DEFAULT_FILENAME)
-
-
-def get_file_path(file):
-
-    DEFAULT_FILENAME = "tests.toml"
-
-    if not file:
-        file = DEFAULT_FILENAME
-
-    if "/" in file:
-        return file
-    else:
-        root = find_project_root(file)
-        return os.path.join(root, file)
-
-def get_python_files(directory):
-    directory = Path(directory)
-    python_files = set([path.absolute() for path in directory.rglob("*.py") if not path.is_symlink()])
-    return list(python_files)
-
-def filter_excluded_files(files, excluded_path, ignore_path):
-    with open(excluded_path, 'r') as f:
-        patterns = f.read().splitlines()
-
-    if os.path.isfile(ignore_path):
-        with open(ignore_path, 'r') as f:
-            patterns += f.read().splitlines()
-
-    spec = pathspec.PathSpec.from_lines('gitwildmatch', patterns)
-
-    files = [f for f in files if not spec.match_file(f)]
-
-    return files
-
-def evaluate_tests(path, cmd_only, regex_only):
-
-    assert (os.path.isfile(path))
-
-    config = toml.load(path)
-    python_tests = config.get("python-tests")
-    custom_tests = config.get("custom-tests")
-    root = find_project_root()
-
-    files = get_python_files(root)
-
-    EXCLUDED_PATH = "ratchet_excluded.txt"
-    excluded_path = os.path.join(root, EXCLUDED_PATH)
-
-    ignore_path = os.path.join(root, ".gitignore")
-
-    files = filter_excluded_files(files, excluded_path, ignore_path)
-
-    test_issues = {}
-    custom_issues = {}
-
-    if python_tests and not cmd_only:
-        test_issues = evaluate_python_tests(files, python_tests)
-
-    if custom_tests and not regex_only:
-        custom_issues = evaluate_command_tests(files, custom_tests)
-
-    return (test_issues, custom_issues)
-
-def print_issues(issues):
-    for test_name, matches in issues.items():
-        if matches:
-            print(f"\n{test_name} — matched {len(matches)} issue(s):")
-            for match in matches:
-                file = match['file']
-                line = match.get('line')
-                content = match['content']
-                truncated = content if len(content) <= 80 else content[:80] + "..."
-                if line is not None:
-                    print(f"  → {file}:{line}: {truncated}")
-                else:
-                    print(f"  → {file}: {truncated}")
-        else:
-            print(f"\n{test_name} — no issues found.")
-
-
-def load_ratchet_results():
-    path = get_ratchet_path()
-    with open(path, 'r') as file:
-        data = json.load(file)
-    return data
-    
-
-def evaluate_python_tests(files, test_str):
-    assert len(files) != 0
-    assert len(test_str) != 0
-
-    results = {}
-
-    for test_name, rule in test_str.items():
-        pattern = re.compile(rule["regex"])
-        results[test_name] = []
-
-        for file_path in files:
-            with open(file_path, 'r', encoding='utf-8') as f:
-                for lineno, line in enumerate(f, 1):
-                    if pattern.search(line):
-                        results[test_name].append({
-                            "file": str(file_path),
-                            "line": lineno,
-                            "content": line.strip()
-                        })
-
-    return results
-    
-def get_ratchet_path():
-    root = find_project_root()
-    RATCHET_NAME = "ratchet_values.json"
-    ratchet_file_path = os.path.join(root, RATCHET_NAME)
-    return ratchet_file_path
-
-
-def evaluate_command_tests(files, test_str):
-    assert len(test_str) != 0
-    assert len(files) != 0
-
-    results = {}
-
-    for test_name, test_dict in test_str.items():
-        command_template = test_dict["command"]
-        results[test_name] = []
-
-        for file in files:
-            cmd_str = f"echo {file} | {command_template}"
-
-            try:
-                result = subprocess.run(
-                    cmd_str,
-                    shell=True,
-                    text=True,
-                    capture_output=True,
-                    timeout=5
-                )
-
-                output = result.stdout.strip()
-                if output:
-                    lines = output.splitlines()
-                    for line in lines:
-                        results[test_name].append({
-                            "file": str(file),
-                            "line": None,
-                            "content": line.strip()
-                        })
-
-            except subprocess.TimeoutExpired:
-                print(f"Timeout while running test '{test_name}' on {file}")
-    return results
-
-def results_to_json(results):
-
-    test_issues, custom_issues = results
-    counts = {}
-
-    for name, matches in test_issues.items():
-        counts[name] = len(matches)
-
-    for name, matches in custom_issues.items():
-        counts[name] = counts.get(name, 0) + len(matches)
-
-    return json.dumps(counts, indent=2, sort_keys=True)
-
-def update_ratchets(test_path, cmd_mode, regex_mode):
-    results = evaluate_tests(test_path, cmd_mode, regex_mode)
-    results_json = results_to_json(results)
-    path = get_ratchet_path()
-    with open(path, 'w') as file:
-        file.writelines(results_json)
-
-
-
-from datetime import datetime
-
-def print_issues_with_blames(results, max_count):
-    enriched_test_issues, enriched_custom_issues = add_blames(results)
-
-    def _parse_time(ts):
-        if not ts:
-            return datetime.max
-        try:
-            return datetime.fromisoformat(ts)
-        except Exception:
-            return datetime.max
-
-    def _print_section(section_name, issues_dict):
-        for test_name, matches in issues_dict.items():
-            if matches:
-                sorted_matches = sorted(matches, key=lambda m: _parse_time(m.get("blame_time")))
-                print("\n" + "-"*40)
-                print(f"{section_name} — {test_name} ({len(sorted_matches)} issue{'s' if len(sorted_matches)!=1 else ''}):")
-                print("-"*40)
-                count = 0
-                for match in sorted_matches:
-                    count += 1
-                    if count > max_count:
-                        break
-                    file_path = match.get("file", "<unknown>")
-                    line_no = match.get("line")
-                    content = match.get("content", "").strip()
-                    truncated = content if len(content) <= 80 else content[:80] + "..."
-                    author = match.get("blame_author") or "Unknown"
-                    ts = match.get("blame_time") or "Unknown"
-                    if line_no is not None:
-                        print(f"  → {file_path}:{line_no}  by {author} at {ts}")
-                        print(f"       {truncated}")
-                    else:
-                        print(f"  → {file_path}  by {author} at {ts}")
-                        print(f"       {truncated}")
-            else:
-                # No matches for this test
-                print(f"\n{section_name} — {test_name}: no issues found.")
-
-    _print_section("Regex Test", enriched_test_issues)
-    _print_section("Command Test", enriched_custom_issues)
-
-def add_blames(results):
-
-    test_issues, custom_issues = results
-
-    # Determine repo root to run git commands in
-    try:
-        repo_root = find_project_root()
-    except Exception:
-        repo_root = None  # if not in a git repo, blame will fail
-
-    def get_blame_for_line(file_path, line_no):
-        """
-        Returns (author, timestamp_iso) for a given file and line number via git blame.
-        If anything fails, returns (None, None).
-        """
-        if repo_root is None:
-            return None, None
-        # Use porcelain format for easier parsing
-        cmd = ["git", "blame", "-L", f"{line_no},{line_no}", "--porcelain", file_path]
-        try:
-            res = subprocess.run(cmd, capture_output=True, text=True, cwd=repo_root, timeout=5)
-            if res.returncode != 0:
-                return None, None
-            author = None
-            author_time = None
-            for l in res.stdout.splitlines():
-                if l.startswith("author "):
-                    author = l[len("author "):].strip()
-                elif l.startswith("author-time "):
-                    # author-time is a Unix timestamp (seconds since epoch)
-                    try:
-                        ts = int(l[len("author-time "):].strip())
-                        # convert to ISO 8601; uses local timezone
-                        author_time = datetime.fromtimestamp(ts).isoformat()
-                    except Exception:
-                        author_time = None
-                # once we have both, we can break
-                if author is not None and author_time is not None:
-                    break
-            return author, author_time
-        except Exception:
-            return None, None
-
-    def get_last_commit_for_file(file_path):
-        """
-        Returns (author, timestamp_iso) for the last commit touching this file via git log.
-        If fails, returns (None, None).
-        """
-        if repo_root is None:
-            return None, None
-        cmd = ["git", "log", "-1", "--format=%an;%at", "--", file_path]
-        try:
-            res = subprocess.run(cmd, capture_output=True, text=True, cwd=repo_root, timeout=5)
-            if res.returncode != 0 or not res.stdout.strip():
-                return None, None
-            out = res.stdout.strip()
-            # format is "Author Name;timestamp"
-            parts = out.split(";", 1)
-            if len(parts) != 2:
-                return None, None
-            author = parts[0].strip()
-            try:
-                ts = int(parts[1].strip())
-                author_time = datetime.fromtimestamp(ts).isoformat()
-            except Exception:
-                author_time = None
-            return author, author_time
-        except Exception:
-            return None, None
-
-    # Process both test_issues and custom_issues
-    for issues in (test_issues, custom_issues):
-        for test_name, matches in issues.items():
-            for match in matches:
-                file_path = match.get("file")
-                line_no = match.get("line")
-                # Only proceed if file_path exists
-                if not file_path:
-                    continue
-                # If it's an absolute path, convert to relative to repo_root if possible
-                # Git commands accept absolute paths if cwd is repo root, so this is OK.
-                if line_no is not None:
-                    # try blame for the specific line
-                    author, author_time = get_blame_for_line(file_path, line_no)
-                else:
-                    # fallback to last commit touching file
-                    author, author_time = get_last_commit_for_file(file_path)
-                # Attach blame info if found
-                if author is not None:
-                    match["blame_author"] = author
-                else:
-                    match["blame_author"] = None
-                if author_time is not None:
-                    match["blame_time"] = author_time
-                else:
-                    match["blame_time"] = None
-
-    return (test_issues, custom_issues)
-
-if __name__ == "__main__":
-
-    parser = argparse.ArgumentParser(description="Python ratchet testing")
-    parser.add_argument("-f", "--file", help="Specify .toml file with tests")
-
-    parser.add_argument(
-        "-b", "--blame",
-        action="store_true",
-        help="Run only custom command-based tests"
-    )
-
-    parser.add_argument(
-        "--max-count", "-m",
-        type=int,
-        default=None,
-        help="Maximum infractions to display per test (only applies with --blame; default is 10)"
-    )
-
-    parser.add_argument(
-        "-c", "--command-only",
-        action="store_true",
-        help="Run only custom command-based tests"
-    )
-
-
-    parser.add_argument(
-        "--compare-counts",
-        action="store_true",
-        help="Compare the counts between the current test and the last saved"
-    )
-
-    parser.add_argument(
-        "-r", "--regex-only",
-        action="store_true",
-        help="Run only regex-based tests"
-    )
-
-    parser.add_argument(
-        "-u", "--update-ratchets",
-        action="store_true",
-        help="Update ratchets_values.json"
-    )
-
-    args = parser.parse_args()
-    file = args.file
-
-    cmd_mode = args.command_only
-    regex_mode = args.regex_only
-    update = args.update_ratchets
-    compare_counts = args.compare_counts
-    blame = args.blame
-    max_count = args.max_count
-
-    if not max_count:
-        max_count = 10
-
-    test_path = get_file_path(file)
-
-    if blame:
-        issues = evaluate_tests(test_path, cmd_mode, regex_mode)
-        with_blames = add_blames(issues)
-        print_issues_with_blames(issues, max_count)
-
-    else:
-        if compare_counts:
-            issues = evaluate_tests(test_path, cmd_mode, regex_mode)
-
-            current_json = json.loads(results_to_json(issues))
-            previous_json = load_ratchet_results()
-
-            print_diff(current_json, previous_json)
-
-        else:
-            if update:
-                update_ratchets(test_path, cmd_mode, regex_mode)
-            else:
-                issues = evaluate_tests(test_path, cmd_mode, regex_mode)
-                for issue_type in issues:
-                    print_issues(issue_type)
diff --git a/src/test_ratchet.py b/src/test_ratchet.py
@@ -1,101 +0,0 @@
-import os
-import json
-import pytest
-import toml
-from pathlib import Path
-from run_tests import (
-    evaluate_python_tests,
-    evaluate_command_tests,
-    filter_excluded_files,
-    find_project_root,
-    get_python_files,
-    get_ratchet_path
-)
-
-ROOT = find_project_root()
-TOML_PATH = Path(ROOT) / "tests.toml"
-CONFIG = toml.load(TOML_PATH)
-
-PYTHON_TESTS = CONFIG.get("python-tests", {})
-COMMAND_TESTS = CONFIG.get("custom-tests", {})
-
-def load_baseline_counts():
-    """
-    Load previous counts from ratchet_values.json.
-    Return a dict mapping test_name -> count. If file missing or malformed, return empty dict.
-    """
-    try:
-        ratchet_path = get_ratchet_path()
-        if os.path.isfile(ratchet_path):
-            with open(ratchet_path, 'r', encoding='utf-8') as f:
-                data = json.load(f)
-                if isinstance(data, dict):
-                    # Ensure values are ints
-                    return {k: int(v) for k, v in data.items()}
-    except Exception:
-        pass
-    return {}
-
-BASELINE_COUNTS = load_baseline_counts()
-
-@pytest.mark.parametrize("test_name,rule", PYTHON_TESTS.items())
-def test_python_regex_rule(test_name, rule):
-    # Prepare file list
-    root = find_project_root()
-    files = get_python_files(root)
-    EXCLUDED_PATH = "ratchet_excluded.txt"
-    excluded_path = os.path.join(root, EXCLUDED_PATH)
-    ignore_path = os.path.join(root, ".gitignore")
-    files = filter_excluded_files(files, excluded_path, ignore_path)
-
-    # Evaluate current results
-    results = evaluate_python_tests(files, {test_name: rule})
-    current_matches = results.get(test_name, [])
-    current_count = len(current_matches)
-
-    # Baseline
-    baseline_count = BASELINE_COUNTS.get(test_name, 0)
-
-    # If increased, fail.
-    assert current_count <= baseline_count, (
-        f"Regex violations for '{test_name}' increased: "
-        f"baseline={baseline_count}, current={current_count}\n"
-        + (
-            "\n".join(
-                f"{r['file']}:{r['line']} — {r['content']}"
-                for r in current_matches
-            )
-          if current_count > 0 else ""
-        )
-    )
-
-@pytest.mark.parametrize("test_name,test_dict", COMMAND_TESTS.items())
-def test_custom_command_rule(test_name, test_dict):
-    # Prepare file list
-    root = find_project_root()
-    files = get_python_files(root)
-    EXCLUDED_PATH = "ratchet_excluded.txt"
-    excluded_path = os.path.join(root, EXCLUDED_PATH)
-    ignore_path = os.path.join(root, ".gitignore")
-    files = filter_excluded_files(files, excluded_path, ignore_path)
-
-    # Evaluate current results
-    results = evaluate_command_tests(files, {test_name: test_dict})
-    current_matches = results.get(test_name, [])
-    current_count = len(current_matches)
-
-    # Baseline
-    baseline_count = BASELINE_COUNTS.get(test_name, 0)
-
-    # If increased, fail.
-    assert current_count <= baseline_count, (
-        f"Command violations for '{test_name}' increased: "
-        f"baseline={baseline_count}, current={current_count}\n"
-        + (
-            "\n".join(
-                f"{r['file']} — {r['content']}"
-                for r in current_matches
-            )
-          if current_count > 0 else ""
-        )
-    )
diff --git a/src/validate.py b/src/validate.py
@@ -1,56 +0,0 @@
-import run_tests
-import re
-import toml
-import argparse
-
-# validate rules
-def evaluate_single_regex(regex, custom_str):
-    pattern = re.compile(regex)
-    return pattern.search(custom_str)
-
-def check_valid(python_tests):
-    for test in python_tests:
-        regex = python_tests[test]["regex"]
-        for validation in python_tests[test]["valid"]:
-            for line in validation.splitlines():
-                if evaluate_single_regex(regex, line):
-                    raise AssertionError(f"Regex: {regex} matched {line}")
-
-
-def check_invalid(python_tests):
-
-    for test in python_tests:
-        regex = python_tests[test]["regex"]
-        for validation in python_tests[test]["invalid"]:
-
-            found = False
-
-            for line in validation.splitlines():
-                if evaluate_single_regex(regex, line):
-                    found = True
-            
-            if not found:
-                raise AssertionError(f"Regex: {regex} not matched in {validation}")
-    return 0
-
-if __name__ == "__main__":
-
-    parser = argparse.ArgumentParser(description="Python ratchet testing")
-    parser.add_argument("-f", "--file",)
-
-    args = parser.parse_args()
-    file = args.file
-
-    test_path = run_tests.get_file_path(file)
-
-    config = toml.load(test_path)
-    python_tests = config.get("python-tests")
-
-    if python_tests is None:
-        print("No python tests found, there is nothing to validate.")
-        exit()
-
-    check_valid(python_tests)
-    check_invalid(python_tests)
-
-    print(f"All expected regex invalid/valid samples are correct for:\n{test_path}")

	ratchets Unnamed repository; edit this file 'description' to name the repository.
	Log \| Files \| Refs \| README \| LICENSE

M	.gitignore	\|	3	++-
A	src/ratchets/__init__.py	\|	0
A	src/ratchets/__main__.py	\|	3	+++
A	src/ratchets/abstracted_tests.py	\|	116	+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
A	src/ratchets/run_tests.py	\|	436	+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
A	src/ratchets/test_ratchet.py	\|	34	++++++++++++++++++++++++++++++++++
A	src/ratchets/validate.py	\|	55	+++++++++++++++++++++++++++++++++++++++++++++++++++++++
D	src/run_tests.py	\|	445	-------------------------------------------------------------------------------
D	src/test_ratchet.py	\|	101	-------------------------------------------------------------------------------
D	src/validate.py	\|	56	--------------------------------------------------------