codeflash-ai · KRRT7 · Dec 12, 2025 · Dec 12, 2025 · Dec 12, 2025 · Dec 12, 2025
diff --git a/codeflash/api/aiservice.py b/codeflash/api/aiservice.py
@@ -6,6 +6,7 @@
 import time
 from typing import TYPE_CHECKING, Any, cast
 
+import git
 import requests
 from pydantic.json import pydantic_encoder
 
@@ -637,7 +638,14 @@ def get_aiservice_base_url(self) -> str:
 def safe_get_repo_owner_and_name() -> tuple[str | None, str | None]:
     try:
         git_repo_owner, git_repo_name = get_repo_owner_and_name()
+    except (ValueError, git.exc.InvalidGitRepositoryError):
+        # Expected errors when:
+        # - No remotes are configured (e.g., local-only repos) -> ValueError
+        # - Not in a git repository -> InvalidGitRepositoryError
+        # These are normal and shouldn't be logged as warnings
+        git_repo_owner, git_repo_name = None, None
     except Exception as e:
+        # Unexpected errors should still be logged
         logger.warning(f"Could not determine repo owner and name: {e}")
         git_repo_owner, git_repo_name = None, None
     return git_repo_owner, git_repo_name
diff --git a/codeflash/cli_cmds/cli.py b/codeflash/cli_cmds/cli.py
@@ -143,8 +143,15 @@ def process_and_validate_cmd_args(args: Namespace) -> Namespace:
             exit_with_message(f"File {args.file} does not exist", error_on_exit=True)
         args.file = Path(args.file).resolve()
         if not args.no_pr:
-            owner, repo = get_repo_owner_and_name()
-            require_github_app_or_exit(owner, repo)
+            try:
+                owner, repo = get_repo_owner_and_name()
+                require_github_app_or_exit(owner, repo)
+            except ValueError as e:
+                exit_with_message(
+                    f"Cannot determine repository information: {e}\n"
+                    f"Please ensure your git repository has a remote configured, or use '--no-pr' to optimize locally.",
+                    error_on_exit=True,
+                )
     if args.replay_test:
         for test_path in args.replay_test:
             if not Path(test_path).is_file():
@@ -265,9 +272,19 @@ def handle_optimize_all_arg_parsing(args: Namespace) -> Namespace:
                 apologize_and_exit()
             git_remote = getattr(args, "git_remote", None)
             if not check_and_push_branch(git_repo, git_remote=git_remote):
-                exit_with_message("Branch is not pushed...", error_on_exit=True)
-            owner, repo = get_repo_owner_and_name(git_repo)
-            require_github_app_or_exit(owner, repo)
+                exit_with_message(
+                    "Cannot proceed without a valid git remote configuration. See error message above.",
+                    error_on_exit=True,
+                )
+            try:
+                owner, repo = get_repo_owner_and_name(git_repo)
+                require_github_app_or_exit(owner, repo)
+            except ValueError as e:
+                exit_with_message(
+                    f"Cannot determine repository information: {e}\n"
+                    f"Please ensure your git repository has a remote configured, or use '--no-pr' to optimize locally.",
+                    error_on_exit=True,
+                )
     if not hasattr(args, "all"):
         args.all = None
     elif args.all == "":

diff --git a/codeflash/code_utils/git_utils.py b/codeflash/code_utils/git_utils.py
@@ -80,6 +80,12 @@ def get_current_branch(repo: Repo | None = None) -> str:
 
 def get_remote_url(repo: Repo | None = None, git_remote: str | None = "origin") -> str:
     repository: Repo = repo if repo else git.Repo(search_parent_directories=True)
+    available_remotes = get_git_remotes(repository)
+    if not available_remotes:
+        raise ValueError("No git remotes configured in this repository")
+    if git_remote not in available_remotes:
+        msg = f"Git remote '{git_remote}' does not exist. Available remotes: {', '.join(available_remotes)}"
+        raise ValueError(msg)
     return repository.remote(name=git_remote).url
 
 
@@ -128,6 +134,30 @@ def confirm_proceeding_with_no_git_repo() -> str | bool:
 def check_and_push_branch(repo: git.Repo, git_remote: str | None = "origin", *, wait_for_push: bool = False) -> bool:
     current_branch = repo.active_branch
     current_branch_name = current_branch.name
+    available_remotes = get_git_remotes(repo)
+    if not available_remotes:
+        logger.error(
+            f"❌ No git remotes configured in this repository.\n"
+            f"This appears to be a local-only git repository. To use codeflash with PR features, you need to:\n"
+            f"  1. Create a repository on GitHub (or another git hosting service)\n"
+            f"  2. Add it as a remote: git remote add origin <repository-url>\n"
+            f"  3. Push your branch: git push -u origin {current_branch_name}\n\n"
+            f"Alternatively, you can run codeflash with the '--no-pr' flag to optimize locally without creating PRs."
+        )
+        return False
+
+    # Check if the specified remote exists
+    if git_remote not in available_remotes:
+        logger.error(
+            f"❌ Git remote '{git_remote}' does not exist in this repository.\n"
+            f"Available remotes: {', '.join(available_remotes)}\n\n"
+            f"You can either:\n"
+            f"  1. Use one of the existing remotes by setting 'git-remote' in pyproject.toml\n"
+            f"  2. Add the '{git_remote}' remote: git remote add {git_remote} <repository-url>\n"
+            f"  3. Run codeflash with '--no-pr' to optimize locally without creating PRs."
+        )
+        return False
+
     remote = repo.remote(name=git_remote)
 
     # Check if the branch is pushed

diff --git a/codeflash/discovery/functions_to_optimize.py b/codeflash/discovery/functions_to_optimize.py
@@ -598,8 +598,8 @@ def was_function_previously_optimized(
     # already_optimized_count = 0
     try:
         owner, repo = get_repo_owner_and_name()
-    except git.exc.InvalidGitRepositoryError:
-        logger.warning("No git repository found")
+    except (git.exc.InvalidGitRepositoryError, ValueError) as e:
+        logger.debug(f"Cannot get repository info: {e}")
         owner, repo = None, None
     pr_number = get_pr_number()
 

diff --git a/tests/scripts/end_to_end_test_async.py b/tests/scripts/end_to_end_test_async.py
@@ -1,12 +1,12 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="main.py",
+        file_path=Path("main.py"),
         min_improvement_x=0.1,
         coverage_expectations=[
             CoverageExpectation(
@@ -17,7 +17,7 @@ def run_test(expected_improvement_pct: int) -> bool:
         ],
     )
     cwd = (
-        pathlib.Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "async_e2e"
+        Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "async_e2e"
     ).resolve()
     return run_codeflash_command(cwd, config, expected_improvement_pct)
 

diff --git a/tests/scripts/end_to_end_test_benchmark_sort.py b/tests/scripts/end_to_end_test_benchmark_sort.py
@@ -1,13 +1,13 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
-    cwd = (pathlib.Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
+    cwd = (Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
     config = TestConfig(
-        file_path=pathlib.Path("bubble_sort.py"),
+        file_path=Path("bubble_sort.py"),
         function_name="sorter",
         benchmarks_root=cwd / "tests" / "pytest" / "benchmarks",
         min_improvement_x=0.70,

diff --git a/tests/scripts/end_to_end_test_bubblesort_pytest.py b/tests/scripts/end_to_end_test_bubblesort_pytest.py
@@ -1,12 +1,13 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="bubble_sort.py",
+        file_path=Path("bubble_sort.py"),
         function_name="sorter",
         min_improvement_x=0.70,
         coverage_expectations=[
@@ -15,7 +16,7 @@ def run_test(expected_improvement_pct: int) -> bool:
             )
         ],
     )
-    cwd = (pathlib.Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
+    cwd = (Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
     return run_codeflash_command(
         cwd, config, expected_improvement_pct, ['print("codeflash stdout: Sorting list")', 'print(f"result: {arr}")']
     )

diff --git a/tests/scripts/end_to_end_test_bubblesort_unittest.py b/tests/scripts/end_to_end_test_bubblesort_unittest.py
@@ -1,14 +1,14 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="bubble_sort.py", function_name="sorter", min_improvement_x=0.30
+        file_path=Path("bubble_sort.py"), function_name="sorter", min_improvement_x=0.30
     )
-    cwd = (pathlib.Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
+    cwd = (Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
     return run_codeflash_command(cwd, config, expected_improvement_pct)
 
 

diff --git a/tests/scripts/end_to_end_test_coverage.py b/tests/scripts/end_to_end_test_coverage.py
@@ -1,19 +1,20 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="bubble_sort.py",
+        file_path=Path("bubble_sort.py"),
         function_name="sorter_one_level_depth",
         coverage_expectations=[
             CoverageExpectation(function_name="sorter_one_level_depth", expected_coverage=100.0, expected_lines=[2])
         ],
     )
     cwd = (
-        pathlib.Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "my-best-repo"
+        Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "my-best-repo"
     ).resolve()
     return run_codeflash_command(cwd, config, expected_improvement_pct)
 

diff --git a/tests/scripts/end_to_end_test_futurehouse.py b/tests/scripts/end_to_end_test_futurehouse.py
@@ -1,13 +1,18 @@
+from pathlib import Path
 import os
-import pathlib
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import (
+    CoverageExpectation,
+    TestConfig,
+    run_codeflash_command,
+    run_with_retries
+)
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="src/aviary/common_tags.py",
-        expected_unit_tests=0, # todo: fix bug https://linear.app/codeflash-ai/issue/CF-921/test-discovery-does-not-work-properly-for-e2e-futurehouse-example for context
+        file_path=Path("src/aviary/common_tags.py"),
+        expected_unit_tests=2,
         min_improvement_x=0.05,
         coverage_expectations=[
             CoverageExpectation(
@@ -17,10 +22,10 @@ def run_test(expected_improvement_pct: int) -> bool:
             )
         ],
     )
-    cwd = (
-        pathlib.Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "futurehouse_structure"
+    future_house_working_dir = (
+        Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "futurehouse_structure"
     ).resolve()
-    return run_codeflash_command(cwd, config, expected_improvement_pct)
+    return run_codeflash_command(future_house_working_dir, config, expected_improvement_pct)
 
 
 if __name__ == "__main__":

diff --git a/tests/scripts/end_to_end_test_init_optimization.py b/tests/scripts/end_to_end_test_init_optimization.py
@@ -1,12 +1,12 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="remove_control_chars.py",
+        file_path=Path("remove_control_chars.py"),
         function_name="CharacterRemover.remove_control_characters",
         min_improvement_x=0.1,
         coverage_expectations=[
@@ -15,7 +15,7 @@ def run_test(expected_improvement_pct: int) -> bool:
             )
         ],
     )
-    cwd = (pathlib.Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
+    cwd = (Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
     return run_codeflash_command(cwd, config, expected_improvement_pct)
 
 

diff --git a/tests/scripts/end_to_end_test_topological_sort_worktree.py b/tests/scripts/end_to_end_test_topological_sort_worktree.py
@@ -1,12 +1,12 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
     config = TestConfig(
-        file_path="topological_sort.py",
+        file_path=Path("topological_sort.py"),
         function_name="Graph.topologicalSort",
         min_improvement_x=0.05,
         use_worktree=True,
@@ -19,7 +19,7 @@ def run_test(expected_improvement_pct: int) -> bool:
         ],
         expected_unit_tests=1,
     )
-    cwd = (pathlib.Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
+    cwd = (Path(__file__).parent.parent.parent / "code_to_optimize").resolve()
     return_var = run_codeflash_command(cwd, config, expected_improvement_pct)
     return return_var
 

diff --git a/tests/scripts/end_to_end_test_tracer_replay.py b/tests/scripts/end_to_end_test_tracer_replay.py
@@ -1,7 +1,7 @@
 import os
-import pathlib
+from pathlib import Path
 
-from end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
+from tests.scripts.end_to_end_test_utilities import CoverageExpectation, TestConfig, run_codeflash_command, run_with_retries
 
 
 def run_test(expected_improvement_pct: int) -> bool:
@@ -14,7 +14,7 @@ def run_test(expected_improvement_pct: int) -> bool:
         ],
     )
     cwd = (
-        pathlib.Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "simple_tracer_e2e"
+       Path(__file__).parent.parent.parent / "code_to_optimize" / "code_directories" / "simple_tracer_e2e"
     ).resolve()
     return run_codeflash_command(cwd, config, expected_improvement_pct)
 

diff --git a/tests/scripts/end_to_end_test_utilities.py b/tests/scripts/end_to_end_test_utilities.py
@@ -7,6 +7,12 @@
 import time
 from dataclasses import dataclass, field
 from typing import Optional
+import contextlib
+
+try:
+    import tomllib
+except ImportError:
+    import tomli as tomllib
 
 
 @dataclass
@@ -82,7 +88,6 @@ def run_codeflash_command(
     logging.basicConfig(level=logging.INFO)
     if config.trace_mode:
         return run_trace_test(cwd, config, expected_improvement_pct)
-
     path_to_file = cwd / config.file_path
     file_contents = path_to_file.read_text("utf-8")
     pytest_dir = cwd / "tests" / "pytest"
@@ -102,7 +107,6 @@ def run_codeflash_command(
 
     return_code = process.wait()
     stdout = "".join(output)
-
     validated = validate_output(stdout, return_code, expected_improvement_pct, config)
     if not validated:
         # Write original file contents back to file
@@ -129,7 +133,20 @@ def build_command(
 
     if config.function_name:
         base_command.extend(["--function", config.function_name])
-    base_command.extend(["--tests-root", str(test_root), "--module-root", str(cwd)])
+
+    # Check if pyproject.toml exists with codeflash config - if so, don't override it
+    pyproject_path = cwd / "pyproject.toml"
+    has_codeflash_config = False
+    if pyproject_path.exists():
+        with contextlib.suppress(Exception):
+            with open(pyproject_path, "rb") as f:
+                pyproject_data = tomllib.load(f)
+                has_codeflash_config = "tool" in pyproject_data and "codeflash" in pyproject_data["tool"]
+
+    # Only pass --tests-root and --module-root if they're not configured in pyproject.toml
+    if not has_codeflash_config:
+        base_command.extend(["--tests-root", str(test_root), "--module-root", str(cwd)])
+
     if benchmarks_root:
         base_command.extend(["--benchmark", "--benchmarks-root", str(benchmarks_root)])
     if config.use_worktree:
@@ -164,7 +181,9 @@ def validate_output(stdout: str, return_code: int, expected_improvement_pct: int
         return False
 
     if config.expected_unit_tests is not None:
-        unit_test_match = re.search(r"Discovered (\d+) existing unit test file", stdout)
+        # Match the global test discovery message from optimizer.py which counts test invocations
+        # Format: "Discovered X existing unit tests and Y replay tests in Z.Zs at /path/to/tests"
+        unit_test_match = re.search(r"Discovered (\d+) existing unit tests? and \d+ replay tests? in [\d.]+s at", stdout)
         if not unit_test_match:
             logging.error("Could not find unit test count")
             return False