Parameter Estimation¶


Last session we built a neural network that could predict whether a chemical compound was toxic to bacteria. Feed it a growth curve, and out came a prediction: toxic or not. The model worked well. But if you asked it why a compound was toxic, all you got was a shrug and some weights. The network learned patterns, but it didn't learn biology.

Today we're taking a different approach. Instead of letting an algorithm find patterns, we write down the chemistry (substrate + cell → two cells), work out the differential equations, and then ask: what rate constants make this model match my data?

Why bother when machine learning works so well? Because when you estimate $k = 0.5~\mathrm{h}^{-1}~\mathrm{OD}^{-1}$, that number means something. You can compare it across conditions, relate it to molecular mechanisms, predict behavior under new conditions. A neural network trained on one concentration range might fail catastrophically on another, but a mechanistic model grounded in chemistry keeps working. And when you want to test a hypothesis (does the antibiotic affect substrate affinity or maximum growth rate?), you can answer it by fitting parameters. You can't answer it by examining neural network weights.

The price is that parameter estimation is an inverse problem. You're working backward from noisy observations to underlying causes. Inverse problems are poorly behaved. Small changes in data can produce large changes in estimated parameters. Multiple parameter sets can produce nearly identical curves. The optimization landscape is riddled with local minima. This session teaches you to navigate that landscape.

The logistic growth model¶

Previously we derived logistic growth from a simple chemical reaction network:

$$S + X \xrightarrow{k} 2X$$

A substrate molecule collides with a cell, producing two cells. Mass-action kinetics gives $dX/dt = kXS$. Conservation of mass says $S + X = S_0 + X_0$. Substitute and you get:

$$\frac{dX}{dt} = kX(S_0 + X_0 - X)$$

This is the logistic equation. Three parameters: $k$ is the reaction rate constant ($\mathrm{h}^{-1}~\mathrm{OD}^{-1}$), $S_0$ is the initial substrate ($\mathrm{OD}$), $X_0$ is the initial cell density ($\mathrm{OD}$).

The forward problem is straightforward: given parameters, integrate the ODE to predict the curve. Today we solve the inverse problem: given measurements $(t_1, y_1), \ldots, (t_n, y_n)$, find the parameters $(k, S_0, X_0)$ that produced them.

The objective function¶

To estimate parameters, you need a measure of fit quality. The standard choice is sum of squared errors:

$$J(\theta) = \sum_{i=1}^{n} \left[ y_i - X(t_i; \theta) \right]^2$$

where $\theta = (k, S_0, X_0)$. For each time point, you compute the difference between measurement and prediction, square it so positive and negative errors don't cancel, then sum them up. Lower is better. Zero means perfect agreement.

Your goal is to find $\theta^* = \arg\min_{\theta} J(\theta)$.

Why squared errors? Because they're differentiable, they penalize large errors more heavily, and there are fast algorithms for minimizing them. But this is a choice, not a law of nature. You could use absolute errors, which are less sensitive to outliers, or asymmetric penalties if errors in one direction matter more than errors in the other. For this session we'll stick with squared errors because that's what most software expects.
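
As a standalone illustration (with made-up numbers, not data from this session), here is how the two loss choices weigh the same residuals differently:

In [ ]:
import numpy as np

# Made-up residuals, purely to compare the two loss functions.
y_meas = np.array([0.10, 0.25, 0.60, 0.90])   # hypothetical measurements (OD)
y_pred = np.array([0.12, 0.22, 0.70, 0.88])   # hypothetical model predictions (OD)

residuals = y_meas - y_pred
sse = np.sum(residuals**2)        # sum of squared errors (used in this session)
sae = np.sum(np.abs(residuals))   # sum of absolute errors (a robust alternative)

print(f"SSE = {sse:.4f}, SAE = {sae:.4f}")
# The single 0.10 OD error dominates the SSE far more than the SAE:
# squaring penalizes large errors more heavily.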

Implementation with units¶

Before we can optimize anything, we need to simulate growth. Here's the setup:

In [1]:
# % pip install numpy matplotlib pint solve_ivp_pint scipy
In [2]:
import numpy as np
import matplotlib.pyplot as plt
from pint import UnitRegistry
from solve_ivp_pint import solve_ivp
from scipy.optimize import minimize, differential_evolution
import time

ureg = UnitRegistry()
Q = ureg.Quantity
ureg.define('OD = [] = optical_density')

rng = np.random.default_rng(42)

def logistic_rhs(t, y, k, S0, X0):
    """Right-hand side of logistic ODE"""
    X = y[0]
    S = S0 + X0 - X
    dXdt = k * X * S
    return [dXdt]

def simulate_logistic(t_points, k, S0, X0):
    """Integrate the logistic growth ODE"""
    y0 = [X0]
    t_span = (t_points[0], t_points[-1])
    
    sol = solve_ivp(logistic_rhs, t_span, y0, args=(k, S0, X0),
                    t_eval=t_points, method='LSODA')
    
    y_list = sol.y[0]
    y_array = Q(np.array([y.m for y in y_list]), y_list[0].units)
    return y_array

print("Setup complete!")
Setup complete!

Now generate some synthetic data to test our methods:

In [3]:
k_true = Q(0.5, 'hour**-1 / OD')
S0_true = Q(0.99, 'OD')
X0_true = Q(0.01, 'OD')
K_true = S0_true + X0_true

t_data = Q(np.linspace(0, 14, 30), 'hour')
y_true = simulate_logistic(t_data, k_true, S0_true, X0_true)
y_data = y_true + Q(rng.normal(0, 0.02, len(t_data)), 'OD')

plt.figure(figsize=(8, 5))
plt.plot(t_data.m, y_data.m, 'o', alpha=0.6, label='Noisy data')
plt.plot(t_data.m, y_true.m, 'r-', alpha=0.5, label='True curve')
plt.xlabel('Time (h)')
plt.ylabel('OD')
plt.title('Synthetic Growth Curve')
plt.legend()
plt.grid(True, alpha=0.3)
plt.show()
[Figure: Synthetic Growth Curve — noisy data points with the true curve overlaid]

This gives us a "perfect" growth curve with known parameters, plus measurement noise. Now we can test whether our optimization methods can recover the true parameters from noisy data.

The optimization landscape¶

Before trying to find the minimum, let's visualize what we're up against. We'll compute $J(\theta)$ for many different parameter values and plot it. Since we have three parameters we can't visualize the full space, but we can fix $X_0$ at its true value and plot $J$ as a function of $k$ and $K = S_0 + X_0$:

In [4]:
k_values = np.linspace(0.3, 0.7, 40)
K_values = np.linspace(0.7, 1.3, 40)

J = np.zeros((len(K_values), len(k_values)))
for i, K_val in enumerate(K_values):
    for j, k_val in enumerate(k_values):
        k_test = Q(k_val, 'hour**-1 / OD')
        K_test = Q(K_val, 'OD')
        S0_test = K_test - X0_true
        
        y_pred = simulate_logistic(t_data, k_test, S0_test, X0_true)
        J[i, j] = np.sum(((y_data - y_pred).m_as('OD'))**2)

plt.figure(figsize=(8, 6))
plt.contour(k_values, K_values, np.log10(J), levels=20, cmap='viridis')
plt.plot(k_true.m, K_true.m, 'r*', markersize=15, label='True parameters')
plt.xlabel(r'$k$ ($\mathrm{h}^{-1}~\mathrm{OD}^{-1}$)')
plt.ylabel(r'$K = S_0 + X_0$ ($\mathrm{OD}$)')
plt.title('Objective Function Landscape')
plt.colorbar(label=r'$\log_{10}(J)$')
plt.legend()
plt.show()
[Figure: Objective Function Landscape — contours of $\log_{10}(J)$ in the $(k, K)$ plane, true parameters marked with a star]

The landscape has a clear minimum near the true parameters. But notice the shape: the contours are elongated diagonally. This happens because $k$ and $K$ are correlated through their product $\mu = kK$, which determines the exponential growth rate. If you increase $k$ while decreasing $K$ proportionally, you can keep $\mu$ nearly constant, so the fit quality doesn't change much. The valley runs along this diagonal direction.

This shape matters for optimization. Gradient methods struggle with elongated valleys. They tend to oscillate across the narrow direction while making slow progress along the long direction.

Identifiability: when your data doesn't tell you enough¶

Sometimes your data simply doesn't contain enough information to determine all parameters. This is the identifiability problem. Let me show you an example.

Compare two scenarios. First, you measure a full growth curve from exponential phase through plateau, 0 to 14 hours. The curve shows you the initial density ($X_0 \approx 0.01$ OD), the exponential growth rate ($\mu = k(S_0 + X_0) \approx 0.5~\mathrm{h}^{-1}$), and the plateau height ($K = S_0 + X_0 \approx 1.0$ OD). From these three observables you can recover all three CRN parameters.

Now suppose you only measure during exponential growth, 0 to 5 hours, before the plateau. You still see $X_0$ and $\mu$, but you never see where the plateau is. During exponential growth the model simplifies to $X(t) \approx X_0 e^{\mu t}$. This doesn't depend on $K$ at all. You could have $K = 1.0$, $K = 2.0$, or $K = 10.0$, and all three would produce identical exponential phases.
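
A quick numerical check makes this concrete. The sketch below (using the helper from the setup cells and illustrative values of $K$) simulates the first five hours with $\mu = kK$ held at $0.5~\mathrm{h}^{-1}$ while $K$ varies tenfold:

In [ ]:
# Illustrative check: during exponential phase, curves with the same mu = k*K
# but very different K differ by roughly the measurement noise or less.
t_short = Q(np.linspace(0, 5, 20), 'hour')
mu_fixed = Q(0.5, 'hour**-1')

for K_val in [1.0, 2.0, 10.0]:
    K_test = Q(K_val, 'OD')
    k_test = mu_fixed / K_test          # keep mu = k*K constant
    S0_test = K_test - X0_true
    y_short = simulate_logistic(t_short, k_test, S0_test, X0_true)
    print(f"K = {K_val:5.1f} OD: OD at 5 h = {y_short[-1].m:.4f}")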

Let's visualize this by comparing the objective landscapes:

In [5]:
# Full curve: 0-14h (includes plateau)
t_full = Q(np.linspace(0, 14, 30), 'hour')
y_full = simulate_logistic(t_full, k_true, S0_true, X0_true)
y_full = y_full + Q(rng.normal(0, 0.02, len(t_full)), 'OD')

# Exponential only: 0-5h (no plateau)
t_exp_only = Q(np.linspace(0, 5, 15), 'hour')
y_exp_only = simulate_logistic(t_exp_only, k_true, S0_true, X0_true)
y_exp_only = y_exp_only + Q(rng.normal(0, 0.01, len(t_exp_only)), 'OD')

print(f"Full curve: max OD = {y_full.max().m:.3f}")
print(f"Exp-only: max OD = {y_exp_only.max().m:.3f} ({y_exp_only.max().m/K_true.m*100:.1f}% of K)")

# Compute landscapes for both
K_values_wide = np.linspace(0.7, 2.0, 40)

J_full = np.zeros((len(K_values), len(k_values)))
J_exp = np.zeros((len(K_values_wide), len(k_values)))

for i, K_val in enumerate(K_values):
    for j, k_val in enumerate(k_values):
        k_test = Q(k_val, 'hour**-1 / OD')
        K_test = Q(K_val, 'OD')
        S0_test = K_test - X0_true
        y_pred = simulate_logistic(t_full, k_test, S0_test, X0_true)
        J_full[i, j] = np.sum(((y_full - y_pred).m_as('OD'))**2)

for i, K_val in enumerate(K_values_wide):
    for j, k_val in enumerate(k_values):
        k_test = Q(k_val, 'hour**-1 / OD')
        K_test = Q(K_val, 'OD')
        S0_test = K_test - X0_true
        y_pred = simulate_logistic(t_exp_only, k_test, S0_test, X0_true)
        J_exp[i, j] = np.sum(((y_exp_only - y_pred).m_as('OD'))**2)

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(14, 5))

ax1.contour(k_values, K_values, np.log10(J_full), levels=20, cmap='viridis')
ax1.plot(k_true.m, K_true.m, 'r*', markersize=15)
ax1.set_xlabel(r'$k$')
ax1.set_ylabel(r'$K$')
ax1.set_title('Full Growth Curve (0-14h)')
ax1.grid(True, alpha=0.3)

ax2.contour(k_values, K_values_wide, np.log10(J_exp), levels=20, cmap='viridis')
ax2.plot(k_true.m, K_true.m, 'r*', markersize=15)
ax2.set_xlabel(r'$k$')
ax2.set_ylabel(r'$K$')
ax2.set_title('Exponential Phase Only (0-5h)')
ax2.grid(True, alpha=0.3)

plt.tight_layout()
plt.show()
Full curve: max OD = 0.937
Exp-only: max OD = 0.111 (11.1% of K)
[Figure: objective landscapes for the full growth curve (0-14 h, left) and for exponential phase only (0-5 h, right)]

The difference is striking. For the full curve (left panel), the contours close tightly around the true parameters: a well-defined minimum. For the exponential-only data (right panel), the contours are extremely elongated along the curve where the product $kK = \mu$ stays constant. During exponential growth only that product matters, so any $(k, K)$ pair with the same product fits equally well: you can vary $K$ from 0.7 to 2.0, adjust $k$ proportionally, and the fit quality barely changes.

Look at the numbers. With exponential-only data, the maximum OD reaches only 11% of the carrying capacity, and the objective function is nearly flat along the constant-$\mu$ direction. This is practical non-identifiability: the model structure allows both parameters to be determined in principle, but this particular dataset doesn't contain the information because you never measured the plateau.

What do you do about this? Measure longer to capture the plateau. Or fix $K$ at a reasonable value. Or accept that you can only estimate $\mu$ and $X_0$. The key lesson is: don't try to extract information that isn't in your data.
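
If you go the route of fixing $K$, the problem reduces to a two-parameter fit. Here is a minimal sketch, assuming you trust an external value for the carrying capacity (the $1.0~\mathrm{OD}$ below is purely illustrative):

In [ ]:
# Sketch: work around the non-identifiable K by fixing it at an assumed value
# and fitting only mu and X0 to the exponential-phase data.
K_fixed = Q(1.0, 'OD')   # assumed, e.g. from a previous full-length experiment

def objective_fixed_K(params):
    mu, X0 = params
    if mu <= 0 or X0 <= 0 or X0 >= K_fixed.m:
        return 1e10
    k = Q(mu, 'hour**-1') / K_fixed
    S0 = K_fixed - Q(X0, 'OD')
    y_pred = simulate_logistic(t_exp_only, k, S0, Q(X0, 'OD'))
    return np.sum(((y_exp_only - y_pred).m_as('OD'))**2)

result_fixed = minimize(objective_fixed_K, [0.4, 0.02], method='L-BFGS-B')
print(f"mu = {result_fixed.x[0]:.3f} h⁻¹, X0 = {result_fixed.x[1]:.4f} OD (with K fixed)")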

Reparameterization: choosing better variables¶

Before we start optimizing, let's make a smart choice about variables. Instead of working with $(k, S_0, X_0)$ directly, we'll use:

$$\mu = k(S_0 + X_0) \quad \text{(exponential growth rate)}$$ $$K = S_0 + X_0 \quad \text{(carrying capacity)}$$ $$X_0 = X_0 \quad \text{(initial density)}$$

Why? Because these correspond to observable features of the growth curve. You can estimate $\mu$ from the slope of $\log X$ vs. $t$ during exponential phase. You can read $K$ off the plateau height. You can measure $X_0$ directly at $t=0$. These parameters are more independent (each comes from a different part of the curve), which makes the optimization landscape nicer.

You can always convert back to CRN parameters: $k = \mu/K$ and $S_0 = K - X_0$.
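
For convenience, the conversion can be wrapped in two small helpers (a sketch; the objective function below simply does the same computation inline):

In [ ]:
# Helper sketch: convert between observable and CRN parameterizations.
def obs_to_crn(mu, K, X0):
    """(mu, K, X0) -> (k, S0, X0)"""
    return mu / K, K - X0, X0

def crn_to_obs(k, S0, X0):
    """(k, S0, X0) -> (mu, K, X0)"""
    K = S0 + X0
    return k * K, K, X0

print(obs_to_crn(0.5, 1.0, 0.01))   # (0.5, 0.99, 0.01)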

From now on we work in $(\mu, K, X_0)$ space. Here's the objective function:

In [6]:
def objective(params, t_data, y_data):
    """Objective function in (μ, K, X0) parameterization"""
    mu, K, X0 = params
    
    if K <= 0 or X0 <= 0 or mu <= 0:
        return 1e10
    
    k = mu / K
    S0 = K - X0
    
    try:
        y_pred = simulate_logistic(t_data, Q(k, 'hour**-1 / OD'),
                                   Q(S0, 'OD'), Q(X0, 'OD'))
        residuals = (y_data - y_pred).m_as('OD')
        return np.sum(residuals**2)
    except:
        return 1e10

print("Objective function defined in (μ, K, X0) parameterization")
Objective function defined in (μ, K, X0) parameterization

Gradient descent: fast but fragile¶

The simplest optimization idea is gradient descent: start with an initial guess, compute which direction is downhill, take a step in that direction, and repeat until you reach the bottom. We'll use scipy's L-BFGS-B, a more sophisticated gradient-based (quasi-Newton) method that also handles bound constraints.

L-BFGS-B stands for Limited-memory Broyden-Fletcher-Goldfarb-Shanno with Bounds. It's a quasi-Newton method, meaning it uses gradient information (first derivatives) to approximate the Hessian matrix (second derivatives) without actually computing it. Here's the mathematical foundation.

Newton's method for minimization uses the update rule:

$$\theta_{k+1} = \theta_k - H_k^{-1} \nabla J(\theta_k)$$

where $\nabla J$ is the gradient (first derivatives) and $H$ is the Hessian matrix of second derivatives:

$$H_{ij} = \frac{\partial^2 J}{\partial \theta_i \partial \theta_j}$$

The Hessian tells you the local curvature. If $J$ is a quadratic bowl, Newton's method finds the bottom in one step. The problem is that computing $H$ and inverting it costs $O(n^3)$ operations for $n$ parameters, and you have to do this at every iteration.

BFGS instead maintains an approximation $B_k \approx H_k$ that gets updated at each iteration using only gradient information. When you move from $\theta_k$ to $\theta_{k+1}$, you observe how the gradient changed: $y_k = \nabla J(\theta_{k+1}) - \nabla J(\theta_k)$ and how far you moved: $s_k = \theta_{k+1} - \theta_k$. The BFGS update formula uses these to improve the Hessian approximation:

$$B_{k+1} = B_k + \frac{y_k y_k^T}{y_k^T s_k} - \frac{B_k s_k s_k^T B_k}{s_k^T B_k s_k}$$

The genius is that this formula keeps $B_{k+1}$ positive definite (so the step direction always points downhill), provided the curvature condition $y_k^T s_k > 0$ holds, which the line search enforces, and it incorporates the observed curvature information. The "limited memory" part means that instead of storing the full matrix $B_k$, you only keep the last $m$ pairs $(s_k, y_k)$ (typically $m = 10$) and reconstruct the approximation on the fly. This reduces memory from $O(n^2)$ to $O(mn)$. The "B" adds box constraints: you can specify $\theta_i \in [l_i, u_i]$, and the algorithm projects the step back into the feasible region at each iteration.
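
To make the update concrete, here is a toy one-step illustration on a two-parameter quadratic bowl (nothing to do with scipy's internals; the numbers are arbitrary):

In [ ]:
# Toy BFGS update on J(theta) = 0.5 * theta^T A theta, with an arbitrary A.
A = np.array([[4.0, 0.0],
              [0.0, 1.0]])          # true Hessian of the toy objective
grad = lambda th: A @ th            # gradient of the toy objective

theta_k = np.array([1.0, 1.0])
B_k = np.eye(2)                     # initial Hessian approximation

# Quasi-Newton step using the current approximation
theta_k1 = theta_k - np.linalg.solve(B_k, grad(theta_k))

# Observed step and gradient change
s = theta_k1 - theta_k
y = grad(theta_k1) - grad(theta_k)

# BFGS update: stays positive definite as long as y.s > 0
B_k1 = (B_k + np.outer(y, y) / (y @ s)
            - (B_k @ np.outer(s, s) @ B_k) / (s @ B_k @ s))

print("Updated approximation:\n", B_k1)
print("True Hessian:\n", A)

For this particular toy problem, a single update already brings the approximation close to the true Hessian.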

With a good initial guess, this works beautifully:

In [7]:
initial_guess = [0.45, 0.95, 0.015]

t0 = time.time()
result_good = minimize(objective, initial_guess, args=(t_data, y_data),
                       method='L-BFGS-B', options={'maxiter': 500})
t_good = time.time() - t0

mu_fit, K_fit, X0_fit = result_good.x

print(f"Fitted parameters:")
print(f"  mu = {mu_fit:.4f} h⁻¹ (true: {(k_true * K_true).m:.4f})")
print(f"  K = {K_fit:.4f} OD (true: {K_true.m:.4f})")
print(f"  X0 = {X0_fit:.4f} OD (true: {X0_true.m:.4f})")
print(f"  Objective: {result_good.fun:.6f}")
print(f"  Time: {t_good:.2f}s")

y_fit = simulate_logistic(t_data, Q(mu_fit/K_fit, 'hour**-1 / OD'),
                         Q(K_fit - X0_fit, 'OD'), Q(X0_fit, 'OD'))

plt.figure(figsize=(8, 5))
plt.plot(t_data.m, y_data.m, 'o', alpha=0.6, label='Data')
plt.plot(t_data.m, y_fit.m, 'r-', linewidth=2, label='Fit')
plt.xlabel('Time (h)')
plt.ylabel('OD')
plt.legend()
plt.grid(True, alpha=0.3)
plt.show()
Fitted parameters:
  mu = 0.4937 h⁻¹ (true: 0.5000)
  K = 1.0122 OD (true: 1.0000)
  X0 = 0.0105 OD (true: 0.0100)
  Objective: 0.006840
  Time: 0.41s
[Figure: noisy data with the fitted logistic curve overlaid]

Nearly perfect recovery of the true parameters in less than a second. But here's the problem: what if you don't have a good initial guess?

Let's test gradient descent from 10 random starting points and see what happens:

In [8]:
n_trials = 10
rng_init = np.random.default_rng(123)
successes = 0

print("Testing gradient descent from random starting points:")
print("=" * 70)

for i in range(n_trials):
    mu_init = rng_init.uniform(0.05, 1.5)
    K_init = rng_init.uniform(0.2, 2.0)
    X0_init = rng_init.uniform(0.005, 0.1)
    
    result = minimize(objective, [mu_init, K_init, X0_init],
                     args=(t_data, y_data), method='L-BFGS-B',
                     options={'maxiter': 500})
    
    mu_r, K_r, X0_r = result.x
    
    mu_err = abs(mu_r - (k_true * K_true).m) / (k_true * K_true).m * 100
    K_err = abs(K_r - K_true.m) / K_true.m * 100
    X0_err = abs(X0_r - X0_true.m) / X0_true.m * 100
    
    success = mu_err < 10 and K_err < 10 and X0_err < 10
    if success:
        successes += 1
    
    status = "✓" if success else "✗"
    print(f"{status} Trial {i+1:2d}: mu={mu_r:.3f}, K={K_r:.3f}, X0={X0_r:.3f}, J={result.fun:.3f}")

print("=" * 70)
print(f"Success rate: {successes}/{n_trials} = {successes/n_trials*100:.0f}%")
Testing gradient descent from random starting points:
======================================================================
✗ Trial  1: mu=1.039, K=0.297, X0=0.026, J=2.343
✓ Trial  2: mu=0.494, K=1.012, X0=0.010, J=0.007
✗ Trial  3: mu=1.389, K=0.698, X0=0.083, J=1.791
✗ Trial  4: mu=1.340, K=1.123, X0=0.028, J=9.791
✗ Trial  5: mu=1.245, K=0.585, X0=0.075, J=1.704
✗ Trial  6: mu=0.963, K=1.869, X0=0.027, J=27.230
✗ Trial  7: mu=1.209, K=1.133, X0=0.027, J=8.826
✓ Trial  8: mu=0.494, K=1.012, X0=0.010, J=0.007
✓ Trial  9: mu=0.494, K=1.012, X0=0.010, J=0.007
✗ Trial 10: mu=1.106, K=1.853, X0=0.064, J=29.099
======================================================================
Success rate: 3/10 = 30%

Gradient descent failed 70% of the time. When started far from the optimum, it got stuck.

This is the fundamental limitation of gradient methods. They're local searchers. They follow the gradient downhill to the nearest local minimum, but they have no mechanism to escape and explore the broader landscape. If you start in the wrong basin, you're stuck there.

So when should you use gradient descent? When you have a good initial guess, it's the fastest method. When you're refining an already decent fit. When speed matters more than robustness. But if you have no idea where the parameters are, or if multiple local minima are likely, or if you can't afford to fail, you need something else.

Global optimization: differential evolution¶

When gradient descent fails, you need global optimization. These methods explore the entire parameter space, not just descend to the nearest minimum. We'll use differential evolution.

The basic idea is evolutionary: maintain a population of candidate solutions, create new candidates by combining existing ones, keep the better ones, repeat until convergence. Here's how it works.

Start with a population of candidate parameter sets scattered randomly across your search space. Say you have 15 candidates, each representing a different $(\mu, K, X_0)$ combination. At each iteration, for every candidate in the population, you create a trial candidate by:

  1. Pick three other candidates from the population at random, call them A, B, C
  2. Create a mutant vector: $\text{mutant} = A + F \cdot (B - C)$, where $F$ is a scaling factor (typically 0.5 to 1.0)
  3. Mix the mutant with the current candidate using crossover: for each parameter, randomly decide whether to take it from the mutant or keep the original (crossover probability typically 0.7)
  4. Evaluate the trial candidate: compute $J(\text{trial})$
  5. If the trial is better than the current candidate, replace it. Otherwise keep the current one.

The key insight is that the difference vector $(B - C)$ points in a direction that connects two existing candidates, and scaling it by $F$ controls how far you jump. By adding this to candidate A, you explore new regions of parameter space that are informed by where good solutions already exist. Over many iterations, the population converges toward the global minimum as worse candidates get replaced by better ones.
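
Here is a stripped-down sketch of one generation (the textbook scheme, not scipy's exact internal implementation, which adds several strategy variants):

In [ ]:
# One generation of basic differential evolution for a generic objective f.
def de_generation(f, population, bounds, rng, F=0.8, CR=0.7):
    n_pop, n_dim = population.shape
    lower = np.array([b[0] for b in bounds])
    upper = np.array([b[1] for b in bounds])
    new_population = population.copy()
    for i in range(n_pop):
        # 1. pick three distinct other candidates A, B, C
        idx = rng.choice([j for j in range(n_pop) if j != i], size=3, replace=False)
        A, B, C = population[idx]
        # 2. mutant vector
        mutant = A + F * (B - C)
        # 3. crossover: take each parameter from the mutant with probability CR
        mask = rng.random(n_dim) < CR
        trial = np.clip(np.where(mask, mutant, population[i]), lower, upper)
        # 4./5. greedy selection: keep the trial only if it is at least as good
        if f(trial) <= f(population[i]):
            new_population[i] = trial
    return new_population

# One generation on the (mu, K, X0) objective defined earlier:
de_bounds = [(0.01, 1.5), (0.1, 2.0), (0.001, 0.1)]
pop = np.column_stack([rng.uniform(lo, hi, 15) for lo, hi in de_bounds])
pop = de_generation(lambda p: objective(p, t_data, y_data), pop, de_bounds, rng)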

Unlike gradient descent, differential evolution doesn't need an initial guess. You just specify bounds:

In [9]:
bounds = [(0.01, 1.5),   # mu
          (0.1, 2.0),    # K
          (0.001, 0.1)]  # X0

t0 = time.time()
result_de = differential_evolution(objective, bounds, args=(t_data, y_data),
                                  strategy='best1bin', maxiter=300, seed=42)
t_de = time.time() - t0

mu_de, K_de, X0_de = result_de.x

print(f"Differential evolution:")
print(f"  mu = {mu_de:.4f} h⁻¹ (true: {(k_true * K_true).m:.4f})")
print(f"  K = {K_de:.4f} OD (true: {K_true.m:.4f})")
print(f"  X0 = {X0_de:.4f} OD (true: {X0_true.m:.4f})")
print(f"  Objective: {result_de.fun:.6f}")
print(f"  Time: {t_de:.2f}s")
print(f"  Function evaluations: {result_de.nfev}")
print(f"\nFound the answer without any initial guess, but took {t_de/t_good:.0f}× longer")
Differential evolution:
  mu = 0.4937 h⁻¹ (true: 0.5000)
  K = 1.0122 OD (true: 1.0000)
  X0 = 0.0105 OD (true: 0.0100)
  Objective: 0.006840
  Time: 8.85s
  Function evaluations: 1900

Found the answer without any initial guess, but took 22× longer

It found the answer without any initial guess. But notice it took about 9 seconds instead of about 0.4 seconds, and it needed about 1900 function evaluations. The trade-off is clear: gradient descent is fast if you have a good guess, fragile if you don't. Differential evolution is robust but slow.

Combined strategy: get both¶

Can we get robustness without sacrificing too much speed? Yes. Use differential evolution to get into the right basin, then switch to gradient descent for fast convergence:

In [10]:
t0 = time.time()

# Quick global search (20 iterations)
result_de_quick = differential_evolution(objective, bounds, args=(t_data, y_data),
                                        maxiter=20, seed=42)

# Local refinement
result_final = minimize(objective, result_de_quick.x, args=(t_data, y_data),
                       method='L-BFGS-B', options={'maxiter': 500})

t_combined = time.time() - t0

mu_final, K_final, X0_final = result_final.x

print(f"Combined strategy (DE 20 iter + GD):")
print(f"  μ = {mu_final:.4f} h⁻¹")
print(f"  K = {K_final:.4f} OD")
print(f"  X₀ = {X0_final:.4f} OD")
print(f"  Objective: {result_final.fun:.6f}")
print(f"  Time: {t_combined:.2f}s")
print(f"\nComparison:")
print(f"  Gradient descent (good guess): {t_good:.2f}s")
print(f"  Differential evolution (full): {t_de:.2f}s")
print(f"  Combined strategy: {t_combined:.2f}s")
print(f"\nCombined is {t_de/t_combined:.1f}× faster than full DE")
Combined strategy (DE 20 iter + GD):
  μ = 0.4937 h⁻¹
  K = 1.0122 OD
  X₀ = 0.0105 OD
  Objective: 0.006840
  Time: 5.02s

Comparison:
  Gradient descent (good guess): 0.41s
  Differential evolution (full): 8.85s
  Combined strategy: 5.02s

Combined is 1.8× faster than full DE

The combined strategy is nearly twice as fast as full differential evolution while keeping the robustness of the global search. Twenty iterations of DE are enough to land in the right basin, and gradient descent then zooms in efficiently on the precise minimum. You get global robustness plus local efficiency.

This is what you should use in practice unless you already have a good initial guess.

Experimental data¶

Time to apply these methods to real data. We prepared some bacterial growth curves measured in a plate reader, 96-well format, OD600 every 5 minutes for 26 hours. The data file has 8 wells: A1 is a blank (no bacteria), B1 through H1 contain different bacterial cultures.

Load and parse:

In [11]:
with open('data/plate_reader.txt', 'r') as f:
    lines = f.readlines()

data_lines = [l.strip() for l in lines[1:] if l.strip() and not l.startswith('##')]
headers = data_lines[0].split('\t')

time_hours = []
well_data = {h: [] for h in headers[1:]}

for line in data_lines[1:]:
    parts = line.split('\t')
    time_str = parts[0]
    time_parts = time_str.split(':')
    total_hours = int(time_parts[0]) + int(time_parts[1])/60 + int(time_parts[2])/3600
    time_hours.append(total_hours)
    
    for i, header in enumerate(headers[1:], start=1):
        well_data[header].append(float(parts[i]))

time_hours = np.array(time_hours)

print(f"Loaded {len(time_hours)} time points from {len(headers)-1} wells")
print(f"Wells: {', '.join(headers[1:])}")
Loaded 313 time points from 8 wells
Wells: A1, B1, C1, D1, E1, F1, G1, H1

You have 313 time points over 26 hours, measurements every 5 minutes. Let's visualize:

In [12]:
fig, ax = plt.subplots(figsize=(10, 6))
for well in headers[1:]:
    od = np.array(well_data[well])
    if well == 'A1':
        ax.plot(time_hours, od, 'k--', alpha=0.3, label='A1 (blank)')
    else:
        ax.plot(time_hours, od, marker='o', markersize=2, label=well, alpha=0.7)

ax.set_xlabel('Time (h)')
ax.set_ylabel('OD (600 nm)')
ax.set_title('Plate Reader Data')
ax.legend(bbox_to_anchor=(1.05, 1), loc='upper left')
ax.grid(True, alpha=0.3)
plt.tight_layout()
plt.show()
[Figure: Plate Reader Data — OD600 versus time for wells A1-H1]

The blank stays near zero as expected. All other wells show growth. Some reach different final ODs. Some show what looks like complex behavior, possibly two growth phases.

Let's fit the cleanest-looking well, D1, using our robust combined strategy:

In [13]:
t_exp = Q(time_hours, 'hour')
od_exp = Q(np.array(well_data['D1']), 'OD')

def objective_exp(params):
    mu, K, X0 = params
    if K <= 0 or X0 <= 0 or mu <= 0:
        return 1e10
    k = mu / K
    S0 = K - X0
    try:
        y_pred = simulate_logistic(t_exp, Q(k, 'hour**-1 / OD'),
                                   Q(S0, 'OD'), Q(X0, 'OD'))
        return np.sum(((od_exp - y_pred).m_as('OD'))**2)
    except:
        return 1e10

bounds_exp = [(0.01, 2.0), (0.1, 2.0), (0.001, 0.1)]
result_de_exp = differential_evolution(objective_exp, bounds_exp, maxiter=20, seed=42)
result_exp = minimize(objective_exp, result_de_exp.x, method='L-BFGS-B')

mu_exp, K_exp, X0_exp = result_exp.x

print(f"Well D1 fit:")
print(f"  mu = {mu_exp:.3f} h⁻¹")
print(f"  K = {K_exp:.3f} OD")
print(f"  X0 = {X0_exp:.4f} OD")
print(f"  Objective: {result_exp.fun:.4f}")
Well D1 fit:
  mu = 0.286 h⁻¹
  K = 1.040 OD
  X0 = 0.1120 OD
  Objective: 0.4611

Plot the fit and check the residuals:

In [14]:
y_fit_exp = simulate_logistic(t_exp, Q(mu_exp/K_exp, 'hour**-1 / OD'),
                             Q(K_exp - X0_exp, 'OD'), Q(X0_exp, 'OD'))

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(14, 5))

ax1.plot(t_exp.m, od_exp.m, 'o', markersize=2, alpha=0.5, label='Measured')
ax1.plot(t_exp.m, y_fit_exp.m, 'r-', linewidth=2, label='Logistic fit')
ax1.set_xlabel('Time (h)')
ax1.set_ylabel('OD')
ax1.set_title('Well D1: Logistic Model')
ax1.legend()
ax1.grid(True, alpha=0.3)

residuals = od_exp.m - y_fit_exp.m
ax2.plot(t_exp.m, residuals, 'o', markersize=2)
ax2.axhline(0, color='k', linestyle='--', alpha=0.3)
ax2.set_xlabel('Time (h)')
ax2.set_ylabel('Residual (OD)')
ax2.set_title('Residuals')
ax2.grid(True, alpha=0.3)

plt.tight_layout()
plt.show()
[Figure: Well D1 — logistic fit (left) and residuals (right)]

The residuals are small and randomly scattered around zero. Good sign: the simple logistic model captures this growth curve well.
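
You can also check the "randomly scattered" claim numerically. A rough diagnostic (not a formal test) is the residual RMSE together with the lag-1 autocorrelation, which should be near zero if there is no systematic trend:

In [ ]:
# Rough residual diagnostics for well D1.
rmse = np.sqrt(np.mean(residuals**2))
lag1 = np.corrcoef(residuals[:-1], residuals[1:])[0, 1]
print(f"RMSE = {rmse:.4f} OD, lag-1 autocorrelation = {lag1:.2f}")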

Model extensions: two parallel resources¶

Some wells show behavior that doesn't quite fit simple logistic growth. Well B1, for instance, has a more complex shape. Could there be two substrates supporting growth?

Instead of one substrate reaction ($S + X \xrightarrow{k} 2X$), consider two independent substrates:

$$S_1 + X \xrightarrow{k_1} 2X$$ $$S_2 + X \xrightarrow{k_2} 2X$$

The ODEs become:

$$\frac{dX}{dt} = k_1 X S_1 + k_2 X S_2$$ $$\frac{dS_1}{dt} = -k_1 X S_1$$ $$\frac{dS_2}{dt} = -k_2 X S_2$$

Initial conditions: $X(0) = X_0$, $S_1(0) = S_{1,0}$, $S_2(0) = S_{2,0}$. The total carrying capacity is $K = S_{1,0} + S_{2,0} + X_0$.

This model has five parameters instead of three. We can parameterize it as $(\mu_1, \mu_2, K_1, K_2, X_0)$ where $\mu_i = k_i K_i$ and $K_i = S_{i,0} + X_0$.

Implementation:

In [15]:
def two_resource_model(t, y, k1, k2, S1_0, S2_0, X_0):
    """Two parallel substrates supporting growth"""
    X, S1, S2 = y
    dXdt = k1 * X * S1 + k2 * X * S2
    dS1dt = -k1 * X * S1
    dS2dt = -k2 * X * S2
    return [dXdt, dS1dt, dS2dt]

def simulate_two_resource(t_points, k1, k2, S1_0, S2_0, X_0):
    """Simulate 2-resource growth with pint units"""
    y0 = [X_0, S1_0, S2_0]
    t_span = (t_points[0], t_points[-1])
    
    sol = solve_ivp(
        two_resource_model,
        t_span,
        y0,
        args=(k1, k2, S1_0, S2_0, X_0),
        t_eval=t_points,
        method='LSODA'
    )
    
    # Extract X (first component)
    X_list = sol.y[0]
    X_array = Q(np.array([X.m for X in X_list]), X_list[0].units)
    return X_array

Let's compare single versus two-resource models on Well B1:

In [16]:
t_exp_b1 = Q(time_hours, 'hour')
od_exp_b1 = Q(np.array(well_data['B1']), 'OD')

# Fit single-resource
def objective_single(params):
    mu, K, X0 = params
    if K <= 0 or X0 <= 0 or mu <= 0:
        return 1e10
    k = mu / K
    S0 = K - X0
    try:
        y_pred = simulate_logistic(t_exp_b1, Q(k, 'hour**-1 / OD'),
                                   Q(S0, 'OD'), Q(X0, 'OD'))
        return np.sum(((od_exp_b1 - y_pred).m_as('OD'))**2)
    except:
        return 1e10

result_single = minimize(objective_single, [0.5, 1.0, 0.015],
                        method='L-BFGS-B', options={'maxiter': 1000})
mu_s, K_s, X0_s = result_single.x
print(f'{mu_s=:.3f}, {K_s=:.3f}, {X0_s=:.3f}')

# Fit two-resource
def objective_two(params):
    mu1, mu2, K1, K2, X0 = params
    if any(p <= 0 for p in params):
        return 1e10
    k1, k2 = mu1/K1, mu2/K2
    S1_0, S2_0 = K1 - X0, K2 - X0
    try:
        y_pred = simulate_two_resource(t_exp_b1, Q(k1, 'hour**-1 / OD'), Q(k2, 'hour**-1 / OD'),
                                       Q(S1_0, 'OD'), Q(S2_0, 'OD'), Q(X0, 'OD'))
        return np.sum(((od_exp_b1 - y_pred).m_as('OD'))**2)
    except:
        return 1e10

result_two = minimize(objective_two, [0.4, 0.3, 0.5, 0.5, 0.015],
                     method='L-BFGS-B', options={'maxiter': 2000})
mu1_t, mu2_t, K1_t, K2_t, X0_t = result_two.x
print(f'{mu1_t=:.3f}, {mu2_t=:.3f}, {K1_t=:.3f}, {K2_t=:.3f}, {X0_t=:.3f}')
mu_s=0.249, K_s=1.099, X0_s=0.120
mu1_t=0.791, mu2_t=0.168, K1_t=0.241, K2_t=0.922, X0_t=0.030

The two-resource model improves the fit. This suggests the bacteria first consume a rapidly metabolizable substrate, giving fast early growth, then switch to a slower substrate, giving continued but slower growth. This is consistent with diauxic growth, a well-known phenomenon when bacteria have multiple carbon sources.

Plot both fits with residuals:

In [17]:
k_s = mu_s / K_s
S0_s = K_s - X0_s
y_single = simulate_logistic(t_exp_b1, Q(k_s, 'hour**-1 / OD'),
                            Q(S0_s, 'OD'), Q(X0_s, 'OD'))

k1_t, k2_t = mu1_t/K1_t, mu2_t/K2_t
S1_0_t, S2_0_t = K1_t - X0_t, K2_t - X0_t
y_two = simulate_two_resource(t_exp_b1, Q(k1_t, 'hour**-1 / OD'), Q(k2_t, 'hour**-1 / OD'),
                              Q(S1_0_t, 'OD'), Q(S2_0_t, 'OD'), Q(X0_t, 'OD'))

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(14, 5))

ax1.plot(t_exp_b1.m, od_exp_b1.m, 'o', markersize=2, alpha=0.5, label='Data')
ax1.plot(t_exp_b1.m, y_single.m, 'r-', linewidth=2, label='Single-resource')
ax1.plot(t_exp_b1.m, y_two.m, 'b-', linewidth=2, label='Two-resource')
ax1.set_xlabel('Time (h)')
ax1.set_ylabel('OD')
ax1.set_title('Well B1: Model Comparison')
ax1.legend()

residuals_single = (od_exp_b1 - y_single).m
residuals_two = (od_exp_b1 - y_two).m

ax2.plot(t_exp_b1.m, residuals_single, 'r-', alpha=0.5, label='Single')
ax2.plot(t_exp_b1.m, residuals_two, 'b-', alpha=0.5, label='Two')
ax2.axhline(0, color='k', linestyle='--', alpha=0.3)
ax2.set_xlabel('Time (h)')
ax2.set_ylabel('Residual (OD)')
ax2.set_title('Residuals')
ax2.legend()

plt.tight_layout()
plt.show()
[Figure: Well B1 — single- vs. two-resource fits (left) and their residuals (right)]
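
To see what the fitted two-resource model implies about the substrates, we can re-integrate the ODEs with the fitted values and look at $S_1(t)$ and $S_2(t)$. This sketch uses scipy's own solver on plain floats, imported under a different name so it doesn't shadow the pint-aware `solve_ivp` from the setup cell:

In [ ]:
from scipy.integrate import solve_ivp as scipy_solve_ivp

# Re-integrate the two-resource ODEs with the fitted (unit-stripped) parameters.
sol_sub = scipy_solve_ivp(two_resource_model,
                          (time_hours[0], time_hours[-1]),
                          [X0_t, K1_t - X0_t, K2_t - X0_t],
                          args=(mu1_t / K1_t, mu2_t / K2_t,
                                K1_t - X0_t, K2_t - X0_t, X0_t),
                          t_eval=time_hours, method='LSODA')

plt.figure(figsize=(8, 5))
plt.plot(time_hours, sol_sub.y[1], label='$S_1$ (fast substrate)')
plt.plot(time_hours, sol_sub.y[2], label='$S_2$ (slow substrate)')
plt.xlabel('Time (h)')
plt.ylabel('Remaining substrate (OD equivalents)')
plt.title('Well B1: Fitted Substrate Depletion')
plt.legend()
plt.grid(True, alpha=0.3)
plt.show()

If the diauxic interpretation holds, $S_1$ should be depleted early while $S_2$ declines much more slowly.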

When should you consider model extensions? When residuals show systematic patterns rather than random scatter. When the objective function is much larger than the measurement noise can explain. When there is biological plausibility (a known presence of multiple carbon sources). When model comparison criteria favor the more complex model. But be careful: a model with more parameters will almost always fit better, whether or not the extra parameters are meaningful. Don't overfit; use your biological knowledge to justify model complexity.
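
For the "model comparison criteria" point, a quick sketch: assuming independent Gaussian residuals, the Akaike information criterion can be computed from the SSE, up to an additive constant, as $\mathrm{AIC} = n \ln(\mathrm{SSE}/n) + 2p$, where $p$ is the number of fitted parameters. Lower is better, and the $2p$ penalty term keeps extra parameters from winning for free:

In [ ]:
# AIC sketch (assumes i.i.d. Gaussian residuals; constant terms dropped).
n_points = len(time_hours)

aic_single = n_points * np.log(result_single.fun / n_points) + 2 * 3   # 3 parameters
aic_two    = n_points * np.log(result_two.fun / n_points) + 2 * 5      # 5 parameters

print(f"AIC single-resource: {aic_single:.1f}")
print(f"AIC two-resource:    {aic_two:.1f}")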

Summary¶

Parameter estimation bridges data and mechanism. We've seen that inverse problems are hard because many parameter sets can produce similar curves. Identifiability depends on whether your data covers the full process. The optimization landscape has local minima, flat regions, and elongated valleys that make finding the global minimum challenging.

For methods, gradient descent is fast if you have a good starting point but fragile otherwise. Global optimization is robust but slow. The combined strategy (quick differential evolution followed by local refinement) gives you the best of both worlds.

In practice, reparameterize to observable quantities like $(\mu, K, X_0)$ for easier optimization. Always check residuals for systematic patterns. Consider model extensions when simple models fail systematically, but don't overfit.

The key lessons: Start with the simplest model that captures your process. Use the combined optimization strategy unless you have a good initial guess. Check identifiability by examining whether your data covers the full dynamic range. Examine residuals carefully. Validate biologically by asking whether fitted parameters make sense.

Parameter estimation is both art and science. The algorithms are tools, but you need biological insight to use them well. When a fit fails, ask: is it the optimization, the model, or the data?


License: © 2025 Matthias Függer and Thomas Nowak. Licensed under CC BY-NC-SA 4.0.