from pathlib import Path
import sys
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import matplotlib.image as mpimg
from IPython.display import display

NOTEBOOK_DIR = Path.cwd().resolve()
ROOT = NOTEBOOK_DIR if (NOTEBOOK_DIR / 'data').exists() else NOTEBOOK_DIR.parent
DATA_DIR = ROOT / 'data'
OUTPUT_DIR = ROOT / 'outputs'

python_executable = Path(sys.executable)
if 'qaoa' not in str(python_executable).lower():
    raise RuntimeError(
        f'This study must be executed from the qaoa conda environment. Active interpreter: {python_executable}'
    )

plt.rcParams.update({
    'figure.figsize': (12, 6),
    'axes.grid': True,
    'grid.alpha': 0.25,
    'axes.spines.top': False,
    'axes.spines.right': False,
    'font.size': 11,
    'axes.titlesize': 13,
    'axes.labelsize': 11,
})

PALETTE = {
    'navy': '#0f172a',
    'blue': '#2563eb',
    'teal': '#0f766e',
    'gold': '#b45309',
    'red': '#b91c1c',
    'slate': '#475569',
}

combined_summary = pd.read_csv(OUTPUT_DIR / 'combined_summary.csv')
combined_arch = pd.read_csv(OUTPUT_DIR / 'combined_arch_grid.csv')
combined_noise = pd.read_csv(OUTPUT_DIR / 'combined_noise_robustness.csv')
combined_scaling = pd.read_csv(OUTPUT_DIR / 'combined_scaling_matrix.csv')
application_domains = pd.read_csv(DATA_DIR / 'quantum_application_domains.csv')

def load_png(name: str):
    return mpimg.imread(OUTPUT_DIR / name)

best_arch_row = combined_arch.melt(id_vars='n_layers', var_name='width', value_name='rel_l2').sort_values('rel_l2').iloc[0]
summary_df = pd.DataFrame({
    'artifact': [
        'Best shared architecture',
        'Best shared rel-L2',
        'Noise robustness span',
        'Active interpreter',
    ],
    'value': [
        f"{int(best_arch_row['n_layers'])} layers x {best_arch_row['width']}",
        f"{best_arch_row['rel_l2']:.6e}",
        f"{combined_noise['rel_l2'].max() - combined_noise['rel_l2'].min():.6e}",
        str(python_executable),
    ],
})
display(summary_df)

feature_matrix = pd.DataFrame(
    {
        'Single-benchmark reporting': [0, 0, 0, 0, 0],
        'Shared formulation': [1, 1, 1, 1, 1],
    },
    index=[
        'Unified multi-problem harness',
        'Architecture grid study',
        'Scaling study',
        'Noise robustness sweep',
        'Specialist vs transfer framing',
    ],
)

summary_plot = combined_summary.copy()
summary_plot['rel_l2'] = pd.to_numeric(summary_plot['rel_l2'], errors='coerce')
summary_plot['wall_s'] = pd.to_numeric(summary_plot['wall_s'], errors='coerce')
finite_summary = summary_plot.dropna(subset=['rel_l2']).sort_values('rel_l2')

fig, axes = plt.subplots(1, 2, figsize=(14, 5))
axes[0].imshow(feature_matrix.values, cmap='Blues', vmin=0, vmax=1)
axes[0].set_xticks(range(feature_matrix.shape[1]), feature_matrix.columns, rotation=15)
axes[0].set_yticks(range(feature_matrix.shape[0]), feature_matrix.index)
axes[0].set_title('Comparative Components Beyond a Single Benchmark')
for row_index in range(feature_matrix.shape[0]):
    for col_index in range(feature_matrix.shape[1]):
        axes[0].text(
            col_index,
            row_index,
            'Yes' if feature_matrix.iloc[row_index, col_index] else 'No',
            ha='center',
            va='center',
            color='white' if feature_matrix.iloc[row_index, col_index] else PALETTE['navy'],
            fontsize=10,
            fontweight='bold',
        )

axes[1].barh(
    finite_summary['problem'],
    finite_summary['rel_l2'],
    color=[PALETTE['blue'], PALETTE['teal'], PALETTE['gold']],
    edgecolor='black',
)
axes[1].set_title('Shared-Protocol Relative L2 by Problem With Available References')
axes[1].set_xlabel('Relative L2 error')
for patch, value in zip(axes[1].patches, finite_summary['rel_l2']):
    axes[1].text(value + 0.005, patch.get_y() + patch.get_height() / 2, f'{value:.3f}', va='center')
plt.tight_layout()

display(summary_plot.round(6))

fig, ax = plt.subplots(figsize=(18, 4.6))
ax.axis('off')
table = ax.table(
    cellText=application_domains.values,
    colLabels=application_domains.columns,
    colWidths=[0.2, 0.4, 0.4],
    loc='center',
    cellLoc='left',
)
table.auto_set_font_size(False)
table.set_fontsize(9)
table.scale(1, 1.8)
ax.set_title('Benchmark Families and Real Scientific Domains', pad=18)
plt.tight_layout()

display(application_domains)

arch_long = combined_arch.melt(id_vars='n_layers', var_name='width', value_name='rel_l2')
arch_pivot = arch_long.pivot(index='n_layers', columns='width', values='rel_l2')
scaling_matrix = combined_scaling.set_index('n_col')

fig, axes = plt.subplots(1, 3, figsize=(16, 4.5))

arch_im = axes[0].imshow(arch_pivot.values, cmap='viridis_r')
axes[0].set_xticks(range(len(arch_pivot.columns)), arch_pivot.columns)
axes[0].set_yticks(range(len(arch_pivot.index)), arch_pivot.index)
axes[0].set_title('Architecture Grid: Relative L2')
axes[0].set_xlabel('Width')
axes[0].set_ylabel('Layers')
fig.colorbar(arch_im, ax=axes[0], fraction=0.046)

scale_im = axes[1].imshow(scaling_matrix.values, cmap='magma_r')
axes[1].set_xticks(range(len(scaling_matrix.columns)), scaling_matrix.columns)
axes[1].set_yticks(range(len(scaling_matrix.index)), scaling_matrix.index)
axes[1].set_title('Collocation vs Budget Matrix')
axes[1].set_xlabel('Epoch budget')
axes[1].set_ylabel('Collocation points')
fig.colorbar(scale_im, ax=axes[1], fraction=0.046)

axes[2].plot(
    combined_noise['noise_amp'],
    combined_noise['rel_l2'],
    marker='o',
    color=PALETTE['red'],
    linewidth=2,
 )
axes[2].set_title('Noise Robustness Sweep')
axes[2].set_xlabel('Noise amplitude')
axes[2].set_ylabel('Relative L2 error')
plt.tight_layout()

display(arch_long.sort_values('rel_l2').round(6))

image_specs = [
    ('Benchmark summary', 'combined_benchmark.png'),
    ('Architecture grid', 'combined_arch_grid.png'),
    ('Scaling study', 'combined_scaling_study.png'),
    ('Noise robustness', 'combined_noise_study.png'),
    ('Summary bar chart', 'combined_summary_barchart.png'),
]

fig, axes = plt.subplots(3, 2, figsize=(14, 15))
for axis, (title, image_name) in zip(axes.ravel(), image_specs):
    axis.imshow(load_png(image_name))
    axis.set_title(title)
    axis.axis('off')
axes[-1, -1].axis('off')
plt.tight_layout()

ranked_arch = arch_long.sort_values('rel_l2').reset_index(drop=True)
noise_span = combined_noise['rel_l2'].max() - combined_noise['rel_l2'].min()

fig, axes = plt.subplots(1, 2, figsize=(14, 5))

axes[0].bar(
    ranked_arch.index[:6].astype(str),
    ranked_arch['rel_l2'].iloc[:6],
    color=PALETTE['teal'],
    edgecolor='black',
)
axes[0].set_title('Top Shared Architectures')
axes[0].set_xlabel('Architecture rank')
axes[0].set_ylabel('Relative L2 error')

axes[1].bar(
    ['Noise span', 'Best rel-L2', 'Worst rel-L2'],
    [noise_span, combined_noise['rel_l2'].min(), combined_noise['rel_l2'].max()],
    color=[PALETTE['red'], PALETTE['blue'], PALETTE['gold']],
    edgecolor='black',
)
axes[1].set_title('Robustness Summary')
axes[1].set_ylabel('Relative L2 error')
plt.tight_layout()

display(ranked_arch.round(6).head(6))

Practice	Standard PINN reporting	This study
Protocol	Problem-specific	Unified multi-problem harness
Architecture selection	Per-benchmark tuning	Shared two-dimensional grid search
Compute effects	Unreported or implicit	Explicit collocation–budget matrix
Noise sensitivity	Absent	Robustness sweep
Framing	One-benchmark win	Specialist vs. transfer distinction

	problem	E_pinn	E_exact	delta_E	rel_l2	l_inf	wall_s
0	QHO (n=0)	0.549757	0.5000	0.049757	0.119626	0.073916	2.574739
1	QHO (n=1)	1.560837	1.5000	0.060837	0.136409	0.082964	2.797884
2	Anharmonic	0.572822	0.5375	0.035322	NaN	NaN	2.687483
3	Double Well	0.237697	NaN	NaN	NaN	NaN	3.289648

	benchmark_family	representative_system_class	why_transfer_matters
0	Harmonic confinement	molecular vibrations and trapped-ion motional ...	tests baseline eigenstate recovery under local...
1	Anharmonic confinement	bond-stretching and nonlinear confinement models	tests transfer beyond exactly solvable quadrat...
2	Double-well tunneling	ammonia inversion and coupled quantum dots	tests multi-basin optimization and symmetry-se...
3	Time-dependent transport	electron neutron and cold-atom wavepacket prop...	tests whether stationary PINN design principle...

	n_layers	width	rel_l2
5	5	64	0.265847
4	3	64	0.694198
2	5	32	0.884320
1	3	32	1.274440
0	2	32	1.362821
3	2	64	1.419319

	n_layers	width	rel_l2
0	5	64	0.265847
1	3	64	0.694198
2	5	32	0.884320
3	3	32	1.274440
4	2	32	1.362821
5	2	64	1.419319

Transferable Quantum PINNs Under a Unified Benchmark: Architecture, Scaling, and Robustness¶

Abstract¶

Contributions to the Paper¶

§ 1. Comparative Methodology¶

Distinction From Standard PINN Reporting¶

§ 2. Application Motivation¶

Role of the Anchor Dataset¶

3. Experimental Protocol and Evaluation Criteria¶

Evaluation Logic¶

4. Results and Visual Evidence¶

How to Read the Figures¶

5. Paper-Level Interpretation¶

What This Section Contributes¶

Scientific Relevance¶

Limitations Worth Stating Explicitly¶

	artifact	value
0	Best shared architecture	5 layers x 64
1	Best shared rel-L2	2.658472e-01
2	Noise robustness span	6.189807e-03
3	Active interpreter	/Users/mohuyn/miniforge3/envs/qaoa/bin/python