Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .github/workflows/js-tests.yml
Original file line number Diff line number Diff line change
Expand Up @@ -47,4 +47,5 @@ jobs:
uv run pytest tests/test_languages/test_vitest_e2e.py -v
uv run pytest tests/test_languages/test_javascript_e2e.py -v
uv run pytest tests/test_languages/test_javascript_support.py -v
uv run pytest tests/test_languages/test_javascript_tracer.py -v
uv run pytest tests/code_utils/test_config_js.py -v
458 changes: 0 additions & 458 deletions codeflash/languages/javascript/parse.py

This file was deleted.

340 changes: 340 additions & 0 deletions codeflash/languages/javascript/replay_test.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,340 @@
"""JavaScript replay test generation.

This module provides functionality to generate replay tests from traced JavaScript
function calls. Replay tests allow verifying that optimized code produces the same
results as the original code.

The generated tests can be run with Jest or Vitest, depending on the project's
test framework configuration.
"""

from __future__ import annotations

import json
import sqlite3
import textwrap
from dataclasses import dataclass
from pathlib import Path
from typing import TYPE_CHECKING, Any, Optional

if TYPE_CHECKING:
from collections.abc import Generator


@dataclass
class JavaScriptFunctionModule:
    """Information about a traced JavaScript function for replay test generation."""

    # Name of the traced function (or method) as recorded in the trace database.
    function_name: str
    # Path to the source file the call was traced in.
    file_name: Path
    # Module path used in generated require() calls (path with .js/.ts extension stripped).
    module_name: str
    # Enclosing class name for methods; None for free functions.
    class_name: Optional[str] = None
    # Line number of the definition, when the trace schema recorded one.
    line_no: Optional[int] = None


def get_next_arg_and_return(
    trace_file: str, function_name: str, file_name: str, class_name: Optional[str] = None, num_to_get: int = 25
) -> Generator[Any, None, None]:
    """Get traced function arguments from the database.

    This mirrors the Python version in codeflash/tracing/replay_test.py.

    Args:
        trace_file: Path to the trace SQLite database.
        function_name: Name of the function.
        file_name: Path to the source file.
        class_name: Optional class name for methods. Only honored by the new
            "function_calls" schema; the legacy "traces" schema stores no class
            column, so the filter cannot be applied there.
        num_to_get: Maximum number of traces to retrieve.

    Yields:
        Serialized argument data for each traced call (JSON text or binary
        blob, yielded exactly as stored).

    """
    db = sqlite3.connect(trace_file)
    # Everything after connect() is inside try/finally so the connection is
    # always closed, even if cursor creation or the schema probe fails.
    try:
        cur = db.cursor()
        cur.execute("SELECT name FROM sqlite_master WHERE type='table'")
        tables = {row[0] for row in cur.fetchall()}

        # Prefer the new schema (function_calls table).
        if "function_calls" in tables:
            if class_name:
                cursor = cur.execute(
                    "SELECT args FROM function_calls WHERE function = ? AND filename = ? AND classname = ? AND type = 'call' ORDER BY time_ns ASC LIMIT ?",
                    (function_name, file_name, class_name, num_to_get),
                )
            else:
                cursor = cur.execute(
                    "SELECT args FROM function_calls WHERE function = ? AND filename = ? AND type = 'call' ORDER BY time_ns ASC LIMIT ?",
                    (function_name, file_name, num_to_get),
                )
            while (val := cursor.fetchone()) is not None:
                # args is stored as JSON text or a binary blob; yield as-is.
                yield val[0]

        elif "traces" in tables:
            # Legacy schema: no class column exists, so the same query is used
            # whether or not class_name was supplied.
            cursor = cur.execute(
                "SELECT args FROM traces WHERE function = ? AND file = ? ORDER BY id ASC LIMIT ?",
                (function_name, file_name, num_to_get),
            )
            while (val := cursor.fetchone()) is not None:
                yield val[0]

    finally:
        db.close()


def get_function_alias(module: str, function_name: str, class_name: Optional[str] = None) -> str:
    """Generate a unique alias for a function import.

    Args:
        module: Module path.
        function_name: Function name.
        class_name: Optional class name.

    Returns:
        A valid JavaScript identifier for the function.

    """
    import re

    # Replace every non-alphanumeric character with "_" and trim any
    # leading/trailing underscores left over from path separators.
    sanitized_module = re.sub(r"[^a-zA-Z0-9]", "_", module).strip("_")

    pieces = [sanitized_module]
    if class_name:
        pieces.append(class_name)
    pieces.append(function_name)
    return "_".join(pieces)


def create_javascript_replay_test(
    trace_file: str,
    functions: list[JavaScriptFunctionModule],
    max_run_count: int = 100,
    framework: str = "jest",
    project_root: Optional[Path] = None,
) -> str:
    """Generate a JavaScript replay test file from traced function calls.

    This mirrors the Python version in codeflash/tracing/replay_test.py but
    generates JavaScript test code for Jest or Vitest.

    Args:
        trace_file: Path to the trace SQLite database.
        functions: List of functions to generate tests for.
        max_run_count: Maximum number of test cases per function.
        framework: Test framework ('jest' or 'vitest').
        project_root: Project root for calculating relative imports.

    Returns:
        Generated test file content as a string.

    """
    use_vitest = framework.lower() == "vitest"

    # Constructors cannot be replayed directly; drop them once up front.
    testable = [fn for fn in functions if fn.function_name not in ("__init__", "constructor")]

    # --- imports section -------------------------------------------------
    import_lines: list[str] = []
    if use_vitest:
        # Jest injects describe/test globally; Vitest needs an explicit import.
        import_lines.append("import { describe, test } from 'vitest';")
    import_lines.append("const { getNextArg } = require('codeflash/replay');")
    import_lines.append("")

    for fn in testable:
        alias = get_function_alias(fn.module_name, fn.function_name, fn.class_name)
        if fn.class_name:
            import_lines.append(f"const {{ {fn.class_name}: {alias}_class }} = require('./{fn.module_name}');")
        else:
            import_lines.append(f"const {{ {fn.function_name}: {alias} }} = require('./{fn.module_name}');")
    import_lines.append("")

    # --- metadata ---------------------------------------------------------
    metadata = f"""const traceFilePath = '{trace_file}';
const functions = {json.dumps([fn.function_name for fn in testable])};
"""

    # --- per-function describe blocks ------------------------------------
    test_blocks: list[str] = []
    for fn in testable:
        alias = get_function_alias(fn.module_name, fn.function_name, fn.class_name)
        display_name = f"{fn.class_name}.{fn.function_name}" if fn.class_name else fn.function_name

        if fn.class_name:
            # Method test - need to instantiate the class.
            body = textwrap.dedent(f"""
                describe('Replay: {display_name}', () => {{
                  const traces = getNextArg(traceFilePath, '{fn.function_name}', '{fn.file_name.as_posix()}', {max_run_count}, '{fn.class_name}');

                  test.each(traces.map((args, i) => [i, args]))('call %i', (index, args) => {{
                    // For instance methods, we need to create an instance
                    // The traced args may include 'this' context as first argument
                    const instance = new {alias}_class();
                    instance.{fn.function_name}(...args);
                  }});
                }});
            """)
        else:
            # Regular function test.
            body = textwrap.dedent(f"""
                describe('Replay: {display_name}', () => {{
                  const traces = getNextArg(traceFilePath, '{fn.function_name}', '{fn.file_name.as_posix()}', {max_run_count});

                  test.each(traces.map((args, i) => [i, args]))('call %i', (index, args) => {{
                    {alias}(...args);
                  }});
                }});
            """)
        test_blocks.append(body)

    # --- assemble ---------------------------------------------------------
    header = [
        "// Auto-generated replay test by Codeflash",
        "// Do not edit this file directly",
        "",
    ]
    return "\n".join([*header, *import_lines, metadata, *test_blocks])


def get_traced_functions_from_db(trace_file: Path) -> list[JavaScriptFunctionModule]:
    """Get list of functions that were traced from the database.

    Args:
        trace_file: Path to trace database.

    Returns:
        List of traced function information. Empty if the file is missing or
        the database cannot be read (the failure is logged, not raised).

    """
    if not trace_file.exists():
        return []

    def to_module_path(raw: str) -> str:
        # Normalize Windows separators, then strip only a *trailing* .js/.ts
        # extension. A blanket str.replace would also corrupt paths containing
        # ".js"/".ts" mid-string (e.g. "foo.json.js" -> "fooon").
        cleaned = raw.replace("\\", "/")
        for ext in (".js", ".ts"):
            if cleaned.endswith(ext):
                cleaned = cleaned.removesuffix(ext)
                break
        return cleaned.removeprefix("./")

    try:
        conn = sqlite3.connect(trace_file)
        try:
            cursor = conn.cursor()

            # Check which schema this trace database uses.
            cursor.execute("SELECT name FROM sqlite_master WHERE type='table'")
            tables = {row[0] for row in cursor.fetchall()}

            functions: list[JavaScriptFunctionModule] = []

            if "function_calls" in tables:
                cursor.execute(
                    "SELECT DISTINCT function, filename, classname, line_number FROM function_calls WHERE type = 'call'"
                )
                for func_name, file_name, class_name, line_number in cursor.fetchall():
                    functions.append(
                        JavaScriptFunctionModule(
                            function_name=func_name,
                            file_name=Path(file_name),
                            module_name=to_module_path(file_name),
                            class_name=class_name,
                            line_no=line_number,
                        )
                    )

            elif "traces" in tables:
                # Legacy schema: no class/line information available.
                cursor.execute("SELECT DISTINCT function, file FROM traces")
                for func_name, file_name in cursor.fetchall():
                    functions.append(
                        JavaScriptFunctionModule(
                            function_name=func_name,
                            file_name=Path(file_name),
                            module_name=to_module_path(file_name),
                        )
                    )

            return functions
        finally:
            # Close in finally so a query failure does not leak the connection.
            conn.close()

    except Exception:
        # Log instead of silently swallowing, so database-parsing failures
        # are diagnosable; still degrade gracefully by returning no functions.
        import logging

        logging.getLogger(__name__).exception("Failed to get traced functions from %s", trace_file)
        return []


def create_replay_test_file(
    trace_file: Path,
    output_path: Path,
    framework: str = "jest",
    max_run_count: int = 100,
    project_root: Optional[Path] = None,
) -> Optional[Path]:
    """Generate a replay test file from a trace database.

    This is the main entry point for creating JavaScript replay tests.

    Args:
        trace_file: Path to the trace SQLite database.
        output_path: Path to write the test file.
        framework: Test framework ('jest' or 'vitest').
        max_run_count: Maximum number of test cases per function.
        project_root: Project root for calculating relative imports.

    Returns:
        Path to generated test file, or None if no functions were traced or
        the file could not be written (write failures are logged).

    """
    functions = get_traced_functions_from_db(trace_file)

    if not functions:
        # Nothing was traced (or the database was unreadable) - no test to write.
        return None

    content = create_javascript_replay_test(
        trace_file=str(trace_file),
        functions=functions,
        max_run_count=max_run_count,
        framework=framework,
        project_root=project_root,
    )

    try:
        output_path.parent.mkdir(parents=True, exist_ok=True)
        output_path.write_text(content)
    except OSError:
        # Narrowed from bare Exception: only filesystem errors are expected
        # here, and they are logged instead of silently swallowed.
        import logging

        logging.getLogger(__name__).exception("Failed to write replay test to %s", output_path)
        return None

    return output_path
21 changes: 6 additions & 15 deletions codeflash/languages/javascript/support.py
Original file line number Diff line number Diff line change
Expand Up @@ -1585,30 +1585,21 @@ def instrument_for_behavior(
) -> str:
"""Add behavior instrumentation to capture inputs/outputs.

For JavaScript, this wraps functions to capture their arguments
and return values.
For JavaScript, instrumentation is handled at runtime by the Babel tracer plugin
(babel-tracer-plugin.js) via trace-runner.js. This method returns the source
unchanged since no source-level transformation is needed.

Args:
source: Source code to instrument.
functions: Functions to add tracing to.
output_file: Optional output file for traces.

Returns:
Instrumented source code.
Source code unchanged (Babel handles instrumentation at runtime).

"""
if not functions:
return source

from codeflash.languages.javascript.tracer import JavaScriptTracer

# Use first function's file path if output_file not specified
if output_file is None:
file_path = functions[0].file_path
output_file = file_path.parent / ".codeflash" / "traces.db"

tracer = JavaScriptTracer(output_file)
return tracer.instrument_source(source, functions[0].file_path, list(functions))
# JavaScript tracing is done at runtime via Babel plugin, not source transformation
return source

def instrument_for_benchmarking(self, test_source: str, target_function: FunctionToOptimize) -> str:
"""Add timing instrumentation to test code.
Expand Down
Loading
Loading