googleapis · hebaalazzeh · Jun 15, 2026 · Jun 15, 2026 · Jun 15, 2026 · Jun 15, 2026
@@ -0,0 +1,72 @@
+# Python SDK Import Profiler: Documentation & Breakdown
+
+This document describes the `import_profiler` tooling: the files in its directory, how to run the profiler, and how to read the import trace logs it generates so you can identify the modules worth optimizing.
+
+---
+
+## 1. File Guide & Directory Structure
+The profiling tool is located in the [scripts/import_profiler/](./) directory:
+
+* **[profiler.py](./profiler.py)**: The core executable script. It is designed as a single-file, self-spawning harness that performs process-isolated importing benchmarks and generates trace logs.
+
+---
+
+## 2. Profiler Mechanism (`profiler.py`)
+
+**Objective**
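+The profiler is a process-isolated harness: every iteration imports the target module in a fresh Python subprocess, so each measurement is a cold start. It reports three metrics that can be compared before and after an optimization: Initialization Latency (ms), Peak Memory Usage (MB, the peak of Python allocations tracked by `tracemalloc` during the import), and Dynamic Code Volume (the number of newly loaded modules and the total line count of their `.py` source files).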
+
+**Usage**
+
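+Run this command to collect the metrics (`--module` defaults to `google.cloud.compute` and `--iterations` to 50). On Linux each worker is pinned to CPU core 0 with `taskset` by default; pass `--cpu none` to disable pinning or `--cpu <core>` to choose another core. Add `--csv <path>` to export the per-iteration time and memory samples: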
+```bash
+python profiler.py --module <target_module> --iterations <N>
+```
+
+**Expected Output**
+```text
+--- Results for <target_module> (<N> iterations) ---
+Code Volume (Deterministic):
+  Loaded Modules: <count>
+  Loaded Lines:   <count>
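+Time (ms):
+  P50 (Median): <time>
+  P90:          <time>
+  P99:          <time>
+  Mean:         <time>
+  Min:          <time>
+  Max:          <time>
+  StdDev:       <time>
+RAM (MB):
+  P50 (Median): <memory>
+  P90:          <memory>
+  P99:          <memory>
+  Mean:         <memory>
+  Min:          <memory>
+  Max:          <memory>
+  StdDev:       <memory>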
+```
+
+---
+
+## 3. How to Interpret Python `-X importtime` Trace Logs
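+When run with the `--trace` flag, the script captures the raw stderr trace produced by Python's `-X importtime` option and writes it to `import_trace_<module>.log` in the current directory (dots in the module name are replaced by underscores, e.g. `import_trace_google_cloud_compute.log`). The trace looks like this: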
+
+```text
+import time: self [us] | cumulative | imported package
+import time:       536 |        536 |   _io
+import time:      1077 |       2385 | _frozen_importlib_external
+import time:    773659 |     793010 |                   google.cloud.compute_v1.types.compute
+```
+
+### Explaining the Fields:
+1. **`self [us]` (Microseconds):** The time spent importing the module itself, *excluding* any time spent importing its child dependencies.
+2. **`cumulative` (Microseconds):** The total time spent loading the module *including* all nested imports. This represents the total wait time introduced by this line.
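+3. **Hierarchy Indentation:** Indentation in the `imported package` column shows nesting: an indented module was imported as a side effect of importing a less-indented module, and deeper indentation means it sits deeper in the import chain. Because each line is written when that import *finishes*, nested imports appear *above* the module that triggered them.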
+
+---
+
+## 4. Execution Reference
+Ensure you are in the correct pyenv virtual environment where packages are installed in editable mode:
+
+```bash
+# 1. Run the profiler to get baseline/optimized outcomes (e.g. 5 iterations)
+PYENV_VERSION=py312 python profiler.py --module=google.cloud.compute --iterations=5
+PYENV_VERSION=py312 python profiler.py --module=google.cloud.aiplatform --iterations=5
+
+# 2. Run the profiler to generate trace logs
+PYENV_VERSION=py312 python profiler.py --module=google.cloud.compute --trace
+PYENV_VERSION=py312 python profiler.py --module=google.cloud.aiplatform --trace
+```
@@ -0,0 +1,263 @@
+import sys
+import json
+import time
+import subprocess
+import statistics
+import tracemalloc
+import importlib
+import importlib.util
+import csv
+import os
+import logging
+
def _count_source_lines(module_names):
    """Return the total line count of the ``.py`` sources behind *module_names*.

    Modules are looked up in ``sys.modules``. Entries that are ``None`` or have
    no string ``__file__`` are skipped. A ``.pyc`` path is mapped back to its
    source file when possible; anything that does not end in ``.py`` after that
    (for example extension modules) is not counted. Files that cannot be read
    are logged and skipped, so the count is best-effort.
    """
    total = 0
    for name in module_names:
        mod = sys.modules.get(name)
        file_path = getattr(mod, "__file__", None)
        # ``__file__`` may be missing or None; only string paths are usable.
        if mod is None or not isinstance(file_path, str):
            continue
        if file_path.endswith(".pyc"):
            try:
                file_path = importlib.util.source_from_cache(file_path)
            except (ValueError, NotImplementedError):
                # Not a cache-style path; the '.py' check below skips it.
                pass
        if not file_path.endswith(".py"):
            continue
        try:
            with open(file_path, "r", encoding="utf-8", errors="ignore") as f:
                total += sum(1 for _ in f)
        except (OSError, ValueError) as exc:
            logging.warning("Failed to read lines from %s: %s", file_path, exc)
    return total


def run_worker(target_module):
    """Import *target_module* once in this process and print its metrics.

    The result is printed to stdout as a single line of the form
    ``__METRICS__:<json>`` where the JSON object has the keys ``time_ms``
    (wall-clock import time), ``peak_ram_mb`` (peak memory traced by
    ``tracemalloc`` during the import), ``loaded_modules`` (number of names
    added to ``sys.modules``) and ``loaded_lines`` (line count of the ``.py``
    sources of those modules).

    Args:
        target_module: Dotted name of the module to import.

    Raises:
        ImportError: Propagated from ``importlib.import_module`` if the target
            cannot be imported.
    """
    # Snapshot the already-loaded modules BEFORE the measured window so the
    # snapshot itself is charged to neither the timer nor tracemalloc.
    modules_before = set(sys.modules)

    tracemalloc.start()
    start_time = time.perf_counter()

    # --- TARGET IMPORT ---
    importlib.import_module(target_module)
    # ---------------------

    end_time = time.perf_counter()
    _, peak = tracemalloc.get_traced_memory()
    tracemalloc.stop()

    new_modules = set(sys.modules) - modules_before

    # Output to stdout for the master process to capture.
    metrics = {
        "time_ms": (end_time - start_time) * 1000,
        "peak_ram_mb": peak / (1024 * 1024),
        "loaded_modules": len(new_modules),
        "loaded_lines": _count_source_lines(new_modules),
    }
    print(f"__METRICS__:{json.dumps(metrics)}")
+
+def _run_worker_and_parse(cmd):
+    result = subprocess.run(cmd, capture_output=True, text=True, check=True)
+    try:
+        lines = result.stdout.strip().splitlines()
+        data = None
+        for line in reversed(lines):
+            if line.startswith("__METRICS__:"):
+                data = json.loads(line[len("__METRICS__:"):])
+                break
+        if data is None:
+            raise ValueError("Worker did not output metrics JSON.")
+        for key in ("time_ms", "peak_ram_mb", "loaded_modules", "loaded_lines"):
+            if key not in data:
+                raise KeyError(f"Missing key '{key}' in worker output")
+        return data
+    except (json.JSONDecodeError, IndexError, KeyError, ValueError) as parse_err:
+        print(f"Error parsing worker output: {parse_err}", file=sys.stderr)
+        print(f"Worker stdout:\n{result.stdout}", file=sys.stderr)
+        print(f"Worker stderr:\n{result.stderr}", file=sys.stderr)
+        raise parse_err
+
def _percentiles(values):
    """Return the ``(P50, P90, P99)`` percentiles of *values*.

    The inclusive quantile method is used so every percentile lies within
    ``[min(values), max(values)]``. The default (exclusive) method
    extrapolates beyond the largest sample when there are fewer samples than
    cut points, which made the reported P99 exceed the reported Max.
    With zero or one sample all three percentiles are that sample (or 0.0).
    """
    if len(values) > 1:
        # n=100 yields 99 cut points; index k-1 is the k-th percentile.
        cuts = statistics.quantiles(values, n=100, method="inclusive")
        return cuts[49], cuts[89], cuts[98]
    only = values[0] if values else 0.0
    return only, only, only


def _print_distribution(title, values, digits):
    """Print percentiles, mean, min, max and (if defined) stdev of *values*."""
    p50, p90, p99 = _percentiles(values)
    print(f"{title}:")
    print(f"  P50 (Median): {p50:.{digits}f}")
    print(f"  P90:          {p90:.{digits}f}")
    print(f"  P99:          {p99:.{digits}f}")
    print(f"  Mean:         {statistics.mean(values):.{digits}f}")
    print(f"  Min:          {min(values):.{digits}f}")
    print(f"  Max:          {max(values):.{digits}f}")
    if len(values) > 1:
        # The sample standard deviation needs at least two data points.
        print(f"  StdDev:       {statistics.stdev(values):.{digits}f}")


def run_master(iterations, target_module, cpu="0", csv_path=None):
    """Orchestrate the benchmark and print a summary of the results.

    Spawns this script ``iterations`` times in ``--worker`` mode, one fresh
    interpreter per iteration, collects the time and peak-memory samples, and
    prints percentile/mean/min/max statistics for both.

    Args:
        iterations: Number of worker runs; must be at least 1.
        target_module: Dotted name of the module each worker imports.
        cpu: CPU core passed to ``taskset -c``, or ``"none"`` (any case) to
            run unpinned. If ``taskset`` is not found on the first iteration,
            the run falls back to unpinned execution.
        csv_path: Optional path; when given, the per-iteration samples are
            written there as CSV.

    Raises:
        ValueError: ``iterations`` is less than 1.
        subprocess.CalledProcessError: A worker exited with a non-zero code.
        FileNotFoundError: An executable could not be found and no fallback
            applies.
    """
    if iterations < 1:
        raise ValueError("Number of iterations must be at least 1.")
    times, memories = [], []
    loaded_modules_val, loaded_lines_val = 0, 0

    print(f"Profiling start... Running {iterations} cold-start iterations for {target_module}.")
    if cpu.lower() != "none":
        print(f"CPU Pinning enabled: Pinning processes to core {cpu} using taskset.")
    else:
        print("CPU Pinning disabled.")

    worker_cmd = [sys.executable, __file__, "--worker", f"--module={target_module}"]

    for i in range(iterations):
        pinned = cpu.lower() != "none"
        cmd = (["taskset", "-c", cpu] if pinned else []) + worker_cmd

        try:
            try:
                data = _run_worker_and_parse(cmd)
            except FileNotFoundError:
                # Only a missing ``taskset`` on the very first run is
                # recoverable; anything else is a genuine error.
                if not (pinned and i == 0):
                    raise
                print("WARNING: taskset CPU pinning is not available. Falling back to unpinned execution...")
                cpu = "none"
                data = _run_worker_and_parse(worker_cmd)
        except subprocess.CalledProcessError as e:
            print(f"Error in worker process:\n{e.stderr}", file=sys.stderr)
            raise

        times.append(data["time_ms"])
        memories.append(data["peak_ram_mb"])
        # Code volume is reported from the most recent iteration.
        loaded_modules_val = data["loaded_modules"]
        loaded_lines_val = data["loaded_lines"]

    # Write CSV if requested
    if csv_path:
        with open(csv_path, "w", newline="", encoding="utf-8") as f:
            writer = csv.writer(f)
            writer.writerow(["Iteration", "Time (ms)", "Peak RAM (MB)"])
            for idx, (t, m) in enumerate(zip(times, memories), start=1):
                writer.writerow([idx, f"{t:.2f}", f"{m:.4f}"])
        print(f"Raw metrics successfully exported to CSV: {csv_path}")

    print(f"\n--- Results for {target_module} ({iterations} iterations) ---")
    print("Code Volume (Deterministic):")
    print(f"  Loaded Modules: {loaded_modules_val}")
    print(f"  Loaded Lines:   {loaded_lines_val}")
    _print_distribution("Time (ms)", times, 2)
    _print_distribution("RAM (MB)", memories, 4)
+
def run_trace(target_module):
    """Import *target_module* under ``-X importtime`` and save the trace.

    A fresh interpreter performs the import; whatever it wrote to stderr is
    stored in ``import_trace_<module>.log`` in the current directory, with
    dots in the module name replaced by underscores. A failing import only
    produces a warning (plus the child's output on stderr); the log file is
    still written.
    """
    log_name = "import_trace_" + target_module.replace(".", "_") + ".log"
    print(f"Generating importtime trace log for {target_module} -> {log_name}...")

    # Executed as: python -X importtime -c "import importlib; importlib.import_module(...)"
    snippet = f"import importlib; importlib.import_module({json.dumps(target_module)})"
    child = subprocess.run(
        [sys.executable, "-X", "importtime", "-c", snippet],
        capture_output=True,
        text=True,
    )

    import_failed = child.returncode != 0
    if import_failed and True:
        print(f"WARNING: Import failed with exit code {child.returncode}. The trace log may be incomplete or contain errors.", file=sys.stderr)
    if import_failed and child.stdout:
        print(f"Worker stdout:\n{child.stdout}", file=sys.stderr)
    if import_failed and child.stderr:
        print(f"Worker stderr:\n{child.stderr}", file=sys.stderr)

    # The import-time trace is emitted on stderr, so that is what gets saved.
    with open(log_name, "w", encoding="utf-8") as log:
        log.write(child.stderr)

    print(f"Trace log successfully written to {log_name}")
+
def run_cprofile(target_module):
    """Profile a cold import of *target_module* with cProfile.

    The import runs in a fresh interpreter so that it is a cold start. The
    raw stats are written to ``cprofile_<module>.prof`` in the current
    directory (dots in the module name replaced by underscores) and the 15
    entries with the highest cumulative time are printed.

    If the child process fails, its stderr is printed and the function
    returns without printing statistics.
    """
    import pstats

    prof_file = f"cprofile_{target_module.replace('.', '_')}.prof"
    print(f"Generating cProfile data for {target_module} -> {prof_file}...")

    # The ``python -m cProfile`` command line only accepts a script path or
    # ``-m <module>``; it has no ``-c`` option. Drive cProfile.run() from a
    # ``python -c`` child instead, passing the module name and output path via
    # argv so no quoting of user input is needed.
    code = (
        "import cProfile\n"
        "import importlib\n"
        "import sys\n"
        "cProfile.run('importlib.import_module(sys.argv[1])', sys.argv[2])\n"
    )
    result = subprocess.run(
        [sys.executable, "-c", code, target_module, prof_file],
        capture_output=True, text=True
    )
    if result.returncode != 0:
        print(f"Error generating cProfile data:\n{result.stderr}", file=sys.stderr)
        return

    print(f"cProfile stats successfully written to {prof_file}")

    # Print top bottlenecks
    print("\n--- Top 15 functions by cumulative time ---")
    ps = pstats.Stats(prof_file).sort_stats(pstats.SortKey.CUMULATIVE)
    ps.print_stats(15)
+
def run_mprofile(target_module):
    """Print the top memory allocation sites of a cold import of *target_module*.

    A fresh interpreter starts ``tracemalloc``, imports the module, takes a
    snapshot and prints the first 15 entries of its per-line statistics; that
    output is relayed to stdout here. If the child fails, its stderr is
    printed instead.
    """
    print(f"Generating tracemalloc memory snapshot for {target_module}...")

    script_lines = [
        "import tracemalloc",
        "import importlib",
        "tracemalloc.start()",
        f"importlib.import_module({json.dumps(target_module)})",
        "snapshot = tracemalloc.take_snapshot()",
        "tracemalloc.stop()",
        "top_stats = snapshot.statistics('lineno')",
        "for stat in top_stats[:15]:",
        "    print(stat)",
    ]
    script = "\n".join(script_lines) + "\n"

    child = subprocess.run([sys.executable, "-c", script], capture_output=True, text=True)
    if child.returncode == 0:
        print("\n--- Top 15 memory allocations by line ---")
        # The child's lines already end in newlines; do not add another.
        print(child.stdout, end="")
        return
    print(f"Error generating memory snapshot:\n{child.stderr}", file=sys.stderr)
+
if __name__ == "__main__":
    # Command-line entry point: parse the options and run exactly one mode.
    import argparse

    # Pinning relies on ``taskset``, so it is only enabled by default on Linux.
    default_cpu = "0" if sys.platform.startswith("linux") else "none"

    parser = argparse.ArgumentParser(description="Python SDK Import Profiler")
    parser.add_argument("--module", default="google.cloud.compute", help="Target module to profile")
    parser.add_argument("--iterations", type=int, default=50, help="Number of iterations")
    parser.add_argument("--cpu", default=default_cpu, help="CPU core to pin to (or 'none')")
    parser.add_argument("--csv", help="Path to export CSV results")
    parser.add_argument("--trace", action="store_true", help="Generate importtime trace log")
    parser.add_argument("--cprofile", action="store_true", help="Run cProfile")
    parser.add_argument("--mprofile", action="store_true", help="Run tracemalloc memory snapshot")
    # Internal flag used when the script re-invokes itself; hidden from --help.
    parser.add_argument("--worker", action="store_true", help=argparse.SUPPRESS)

    args = parser.parse_args()

    # Modes that take only the module name, in priority order; the first
    # enabled flag wins. With none set, the full benchmark runs.
    module_only_modes = (
        (args.worker, run_worker),
        (args.trace, run_trace),
        (args.cprofile, run_cprofile),
        (args.mprofile, run_mprofile),
    )
    for enabled, handler in module_only_modes:
        if enabled:
            handler(args.module)
            break
    else:
        run_master(args.iterations, args.module, args.cpu, args.csv)