From cc98795c1628be67493487ae228c57475be75cd8 Mon Sep 17 00:00:00 2001
From: stonelv <zhe.lv.82@gmail.com>
Date: Sun, 3 May 2026 13:06:08 +0800
Subject: [PATCH] kerasga: cache and reuse the cloned model in predict() (dogfooding round 1)

---
 .gitignore                                |   1 +
 examples/KerasGA/benchmark_reuse_model.py | 145 ++++++++++++++++++++++
 pygad/kerasga/__init__.py                 |   8 +-
 pygad/kerasga/kerasga.py                  |  57 ++++++++-
 4 files changed, 206 insertions(+), 5 deletions(-)
 create mode 100644 examples/KerasGA/benchmark_reuse_model.py

diff --git a/.gitignore b/.gitignore
index 4a84706..35b647d 100644
--- a/.gitignore
+++ b/.gitignore
@@ -8,3 +8,4 @@
 __pycache__/
 *.py[cod]
 *$py.class
+.venv/*
diff --git a/examples/KerasGA/benchmark_reuse_model.py b/examples/KerasGA/benchmark_reuse_model.py
new file mode 100644
index 0000000..1fac956
--- /dev/null
+++ b/examples/KerasGA/benchmark_reuse_model.py
@@ -0,0 +1,145 @@
+import time
+import numpy
+import tensorflow.keras
+import pygad.kerasga
+
+
+def create_test_model(input_shape=(3,), output_units=1):
+    """Return a Keras model: Input -> Dense(32, relu) -> Dense(16, relu) -> Dense(output_units, linear)."""
+    inputs = tensor = tensorflow.keras.layers.Input(input_shape)
+    for units, activation in ((32, "relu"), (16, "relu"), (output_units, "linear")):
+        tensor = tensorflow.keras.layers.Dense(units, activation=activation)(tensor)
+    return tensorflow.keras.Model(inputs=inputs, outputs=tensor)
+
+
+def create_test_data(num_samples=1000, input_shape=(3,)):
+    """Seed NumPy's global RNG with 42 and return random (inputs, outputs); outputs are (num_samples, 1)."""
+    numpy.random.seed(42)
+    features = numpy.random.rand(num_samples, *input_shape)
+    return features, numpy.random.rand(num_samples, 1)
+
+
+def benchmark_predict(model, solution, data, num_calls=100, reuse_mode=None, reuse_model_instance=None):
+    """
+    Time repeated calls to pygad.kerasga.predict() for one reuse strategy.
+
+    Parameters
+    ----------
+    model, solution, data : forwarded unchanged to pygad.kerasga.predict().
+    num_calls : int, optional
+        Number of timed predict() calls. The default is 100.
+    reuse_mode : None or bool, optional
+        Value passed as ``reuse_model`` when no instance is supplied.
+    reuse_model_instance : optional
+        When not None, passed as ``reuse_model`` instead of ``reuse_mode``.
+
+    Returns
+    -------
+    (times, predictions_list) : per-call durations in seconds and the matching predictions.
+    """
+    # Empty the cache first so every benchmark run starts without a cached clone.
+    pygad.kerasga.clear_model_cache()
+    # Resolve the argument once, outside the timed region; both modes share one call site.
+    reuse_arg = reuse_mode if reuse_model_instance is None else reuse_model_instance
+    times, predictions_list = [], []
+    for _ in range(num_calls):
+        start = time.perf_counter()
+        pred = pygad.kerasga.predict(model=model, solution=solution, data=data, reuse_model=reuse_arg)
+        times.append(time.perf_counter() - start)
+        predictions_list.append(pred)
+    return times, predictions_list
+
+
+def main():
+    """Time predict() under three reuse_model modes, print a report, and return True if outputs agree."""
+    print("=" * 60)
+    print("KerasGA predict() 缓存复用基准测试")
+    print("=" * 60)
+    # NOTE(review): create_test_data() calls numpy.random.seed(42) again before drawing its data.
+    numpy.random.seed(42)
+    
+    print("\n[1/4] 创建测试模型和数据...")
+    model = create_test_model()
+    data_inputs, data_outputs = create_test_data(num_samples=100)
+    # NOTE(review): data_outputs is not read anywhere below.
+    keras_ga = pygad.kerasga.KerasGA(model=model, num_solutions=10)
+    solution = keras_ga.population_weights[0]
+    
+    NUM_CALLS = 50
+    print(f"\n[2/4] 开始基准测试 (每个模式调用 {NUM_CALLS} 次)...")
+    # Mode A: reuse_model=None, the default path that clones the model on every call.
+    print("\n  模式 A: reuse_model=None (默认 - 每次 clone_model)")
+    times_none, preds_none = benchmark_predict(
+        model, solution, data_inputs, 
+        num_calls=NUM_CALLS, reuse_mode=None
+    )
+    avg_time_none = numpy.mean(times_none)
+    total_time_none = numpy.sum(times_none)
+    print(f"    平均单次: {avg_time_none*1000:.2f} ms")
+    print(f"    总计: {total_time_none:.4f} s")
+    # Mode B: reuse_model=True, predict() keeps one clone in its module-level cache.
+    print("\n  模式 B: reuse_model=True (自动缓存克隆模型)")
+    times_cache, preds_cache = benchmark_predict(
+        model, solution, data_inputs, 
+        num_calls=NUM_CALLS, reuse_mode=True
+    )
+    avg_time_cache = numpy.mean(times_cache)
+    total_time_cache = numpy.sum(times_cache)
+    print(f"    平均单次: {avg_time_cache*1000:.2f} ms")
+    print(f"    总计: {total_time_cache:.4f} s")
+    # Mode C: the caller supplies its own clone, which predict() reuses directly.
+    print("\n  模式 C: reuse_model=user_model (用户提供复用模型)")
+    user_reuse_model = tensorflow.keras.models.clone_model(model)
+    times_user, preds_user = benchmark_predict(
+        model, solution, data_inputs, 
+        num_calls=NUM_CALLS, reuse_model_instance=user_reuse_model
+    )
+    avg_time_user = numpy.mean(times_user)
+    total_time_user = numpy.sum(times_user)
+    print(f"    平均单次: {avg_time_user*1000:.2f} ms")
+    print(f"    总计: {total_time_user:.4f} s")
+    
+    print("\n[3/4] 性能对比...")
+    speedup_cache = avg_time_none / avg_time_cache if avg_time_cache > 0 else float('inf')
+    speedup_user = avg_time_none / avg_time_user if avg_time_user > 0 else float('inf')
+    
+    print(f"\n  模式 B (自动缓存) 相对模式 A 加速: {speedup_cache:.2f}x")
+    print(f"  模式 C (用户模型) 相对模式 A 加速: {speedup_user:.2f}x")
+    
+    print("\n[4/4] 验证输出一致性...")
+    # Only the first prediction of each run is compared against mode A.
+    all_close_cache = numpy.allclose(preds_none[0], preds_cache[0])
+    max_diff_cache = numpy.max(numpy.abs(preds_none[0] - preds_cache[0]))
+    
+    all_close_user = numpy.allclose(preds_none[0], preds_user[0])
+    max_diff_user = numpy.max(numpy.abs(preds_none[0] - preds_user[0]))
+    
+    print(f"\n  模式 A 与 模式 B 输出一致: {all_close_cache}")
+    print(f"  最大差异: {max_diff_cache:.2e}")
+    
+    print(f"\n  模式 A 与 模式 C 输出一致: {all_close_user}")
+    print(f"  最大差异: {max_diff_user:.2e}")
+    
+    print("\n" + "=" * 60)
+    print("基准测试完成")
+    print("=" * 60)
+    
+    print("\n详细统计:")
+    print(f"{'模式':<30} {'平均(ms)':<12} {'总计(s)':<10} {'加速比':<10}")
+    print("-" * 60)
+    print(f"{'A: reuse_model=None (每次clone)':<30} {avg_time_none*1000:<12.2f} {total_time_none:<10.4f} {'1.00x':<10}")
+    print(f"{'B: reuse_model=True (自动缓存)':<30} {avg_time_cache*1000:<12.2f} {total_time_cache:<10.4f} {speedup_cache:.2f}x")
+    print(f"{'C: reuse_model=实例 (用户提供)':<30} {avg_time_user*1000:<12.2f} {total_time_user:<10.4f} {speedup_user:.2f}x")
+    
+    print("\n一致性检查结果:")
+    if all_close_cache and all_close_user:
+        print("  ✓ 所有模式输出完全一致")
+    else:
+        print("  ✗ 警告: 存在输出不一致的情况")
+    # Empty the module-level model cache before returning.
+    pygad.kerasga.clear_model_cache()
+    return all_close_cache and all_close_user
+
+
+if __name__ == "__main__":
+    raise SystemExit(0 if main() else 1)  # non-zero exit status when the modes' outputs disagree
diff --git a/pygad/kerasga/__init__.py b/pygad/kerasga/__init__.py
index 8f5b353..33d63ff 100644
--- a/pygad/kerasga/__init__.py
+++ b/pygad/kerasga/__init__.py
@@ -1,3 +1,9 @@
-from .kerasga import *
+from .kerasga import (
+    KerasGA,
+    model_weights_as_vector,
+    model_weights_as_matrix,
+    predict,
+    clear_model_cache,
+)
 
 __version__ = "1.3.1"
diff --git a/pygad/kerasga/kerasga.py b/pygad/kerasga/kerasga.py
index 738e971..926f610 100644
--- a/pygad/kerasga/kerasga.py
+++ b/pygad/kerasga/kerasga.py
@@ -2,6 +2,9 @@
 import numpy
 import tensorflow.keras
 
+_model_cache = {}  # id(source model) -> cached clone; NOTE(review): id() values can be reused after garbage collection
+
+
 def model_weights_as_vector(model):
     """
     Reshapes the Keras model weight as a vector.
@@ -72,7 +75,8 @@ def predict(model,
             data, 
             batch_size=None,
             verbose=0,
-            steps=None):
+            steps=None,
+            reuse_model=None):
     """
     Use the PyGAD's solution to make predictions using the Keras model.
 
@@ -90,6 +94,15 @@ def predict(model,
         Verbosity mode. The default is 0. Check documentation of the Keras Model.predict() method for more information.
     steps : TYPE, optional
         The total number of steps (batches of samples). The default is None. Check documentation of the Keras Model.predict() method for more information.
+    reuse_model : None, bool, or tensorflow.keras.Model, optional
+        Controls model cloning behavior to reduce overhead:
+        - None or False (default): Always clone the model using clone_model() for each prediction.
+          This preserves the original behavior but may be slower for frequent predictions.
+        - True: Automatically cache and reuse a single cloned model instance. The model is cloned
+          only once (on first call) and subsequent calls only update its weights. This is much
+          faster but uses a module-level cache keyed by the original model's id().
+        - A Keras Model instance: Directly reuse the provided model instance. Only its weights
+          are updated. This gives the user full control over the cached model's lifecycle.
 
     Returns
     -------
@@ -97,11 +110,24 @@ def predict(model,
         The Keras model predictions.
 
     """
-    # Fetch the parameters of the best solution.
+    global _model_cache
+    
     solution_weights = model_weights_as_matrix(model=model,
                                                weights_vector=solution)
-    _model = tensorflow.keras.models.clone_model(model)
-    _model.set_weights(solution_weights)
+    
+    if reuse_model is None or reuse_model is False:
+        _model = tensorflow.keras.models.clone_model(model)
+        _model.set_weights(solution_weights)
+    elif reuse_model is True:
+        model_id = id(model)
+        if model_id not in _model_cache:
+            _model_cache[model_id] = tensorflow.keras.models.clone_model(model)
+        _model = _model_cache[model_id]
+        _model.set_weights(solution_weights)
+    else:
+        _model = reuse_model
+        _model.set_weights(solution_weights)
+    
     predictions = _model.predict(x=data,
                                  batch_size=batch_size,
                                  verbose=verbose,
@@ -109,6 +135,29 @@ def predict(model,
 
     return predictions
 
+
+def clear_model_cache(model=None):
+    """
+    Drop clones cached by predict(reuse_model=True).
+
+    Useful to free memory once cached predictions are finished, or to force
+    a fresh clone after the original model's architecture has changed.
+
+    Parameters
+    ----------
+    model : tensorflow.keras.Model, optional
+        If given, only the entry keyed by id(model) is removed; a model that
+        was never cached is ignored. If None (default), every entry is removed.
+
+    Returns
+    -------
+    None.
+    """
+    if model is None:
+        _model_cache.clear()
+    else:
+        _model_cache.pop(id(model), None)
+
 class KerasGA:
 
     def __init__(self, model, num_solutions):