%matplotlib inline
import numpy as np
import matplotlib
import matplotlib.pyplot as plt
from scipy import stats
import warnings
warnings.filterwarnings('ignore')

plt.rcParams.update({
    'figure.facecolor': '#0a0a14',
    'axes.facecolor': '#151525',
    'axes.edgecolor': '#333',
    'axes.labelcolor': '#e0e0e0',
    'text.color': '#e0e0e0',
    'xtick.color': '#888',
    'ytick.color': '#888',
    'legend.facecolor': '#151525',
    'legend.edgecolor': '#333',
    'figure.dpi': 120,
    'savefig.dpi': 120,
})
print('Environment ready: numpy, matplotlib, scipy')

Environment ready: numpy, matplotlib, scipy

scores = {"mech": 0.78, "evid": 0.72, "novel": 0.75, "feas": 0.72, "impact": 0.76, "drug": 0.74, "safety": 0.68, "comp": 0.74, "data": 0.76, "reprod": 0.72}
dim_labels = ["Mechanistic", "Evidence", "Novelty", "Feasibility", "Impact", "Druggability", "Safety", "Competition", "Data Avail.", "Reproducibility"]
dim_keys = ["mech", "evid", "novel", "feas", "impact", "drug", "safety", "comp", "data", "reprod"]
values = [scores[k] for k in dim_keys]
colors = ['#4fc3f7' if v >= 0.75 else '#81c784' if v >= 0.65 else '#ffd54f' if v >= 0.5 else '#ef5350' for v in values]

fig = plt.figure(figsize=(16, 6))
ax1 = fig.add_subplot(121)
bars = ax1.barh(range(len(dim_labels)), values, color=colors, alpha=0.85, edgecolor='#333')
ax1.set_yticks(range(len(dim_labels)))
ax1.set_yticklabels(dim_labels, fontsize=10)
ax1.set_xlabel('Score', fontsize=11)
ax1.set_xlim(0, 1)
ax1.set_title('HSPA1A — Score Profile', fontsize=14, color='#4fc3f7', fontweight='bold')
ax1.axvline(x=0.75, color='#4fc3f7', linestyle='--', alpha=0.4, label='Excellent (0.75)')
ax1.axvline(x=0.5, color='#ffd54f', linestyle='--', alpha=0.4, label='Moderate (0.50)')
for bar, val in zip(bars, values):
    ax1.text(val + 0.01, bar.get_y() + bar.get_height()/2, f'{val:.2f}', va='center', fontsize=9, color='#e0e0e0')
ax1.legend(fontsize=8)

ax2 = fig.add_subplot(122, polar=True)
angles = np.linspace(0, 2 * np.pi, len(dim_labels), endpoint=False).tolist()
angles += angles[:1]
vals = values + values[:1]
ax2.plot(angles, vals, 'o-', linewidth=2, color='#4fc3f7', alpha=0.8)
ax2.fill(angles, vals, alpha=0.2, color='#4fc3f7')
ax2.set_xticks(angles[:-1])
ax2.set_xticklabels([d[:6] for d in dim_labels], fontsize=7)
ax2.set_ylim(0, 1)
ax2.set_title('Radar', fontsize=12, color='#4fc3f7', fontweight='bold', pad=15)
ax2.set_facecolor('#151525')
plt.tight_layout()
plt.show()

print(f"Composite Score: 0.74")
print(f"Strongest: {dim_labels[values.index(max(values))]} ({max(values):.2f})")
print(f"Weakest: {dim_labels[values.index(min(values))]} ({min(values):.2f})")

Composite Score: 0.74
Strongest: Mechanistic (0.78)
Weakest: Safety (0.68)

np.random.seed(42)
genes = ["HSPA1A", "HSP90AA1", "HSPA8", "DNAJB1", "BAG3", "CHIP"]
n_samples = 25
fold_changes = np.array([1.8, -1.5, 0.8, -0.3, 1.2, 0.5])[:len(genes)]
results = []
for i, gene in enumerate(genes):
    control = np.random.normal(loc=8.0, scale=0.6, size=n_samples)
    disease = np.random.normal(loc=8.0 + fold_changes[i], scale=0.8, size=n_samples)
    t_stat, p_val = stats.ttest_ind(control, disease)
    log2fc = np.mean(disease) - np.mean(control)
    results.append(dict(gene=gene, log2fc=log2fc, p_value=p_val,
        neg_log10_p=-np.log10(max(p_val, 1e-20)),
        control_mean=np.mean(control), disease_mean=np.mean(disease),
        control_std=np.std(control), disease_std=np.std(disease)))

fig, axes = plt.subplots(1, 3, figsize=(20, 6))

# Volcano
ax1 = axes[0]
for r in results:
    c = '#ef5350' if abs(r['log2fc']) > 0.5 and r['p_value'] < 0.05 else '#555'
    ax1.scatter(r['log2fc'], r['neg_log10_p'], c=c, s=120, alpha=0.85, edgecolors='#333', zorder=3)
    ax1.annotate(r['gene'], (r['log2fc'], r['neg_log10_p']), fontsize=8, color='#e0e0e0', xytext=(6, 4), textcoords='offset points')
ax1.axhline(y=-np.log10(0.05), color='#ffd54f', linestyle='--', alpha=0.5, label='p=0.05')
ax1.axvline(x=-0.5, color='#888', linestyle='--', alpha=0.3)
ax1.axvline(x=0.5, color='#888', linestyle='--', alpha=0.3)
ax1.set_xlabel('log2(Fold Change)', fontsize=11)
ax1.set_ylabel('-log10(p-value)', fontsize=11)
ax1.set_title('Volcano Plot', fontsize=13, color='#4fc3f7', fontweight='bold')
ax1.legend(fontsize=8)

# Expression bars
ax2 = axes[1]
x = np.arange(len(genes))
width = 0.35
ax2.bar(x - width/2, [r['control_mean'] for r in results], width, yerr=[r['control_std'] for r in results], label='Control', color='#4fc3f7', alpha=0.8, capsize=3)
ax2.bar(x + width/2, [r['disease_mean'] for r in results], width, yerr=[r['disease_std'] for r in results], label="Neurodegeneration", color='#ef5350', alpha=0.8, capsize=3)
ax2.set_xticks(x)
ax2.set_xticklabels(genes, rotation=45, ha='right', fontsize=9)
ax2.set_ylabel('Expression (log2)', fontsize=11)
ax2.set_title('Control vs Disease', fontsize=13, color='#4fc3f7', fontweight='bold')
ax2.legend(fontsize=9)

# Forest plot
ax3 = axes[2]
for i, r in enumerate(results):
    ci = 1.96 * (r['control_std'] + r['disease_std']) / (2 * np.sqrt(n_samples))
    color = '#4fc3f7' if r['log2fc'] > 0 else '#ef5350'
    ax3.errorbar(r['log2fc'], i, xerr=ci, fmt='o', color=color, capsize=4, markersize=8)
ax3.set_yticks(range(len(genes)))
ax3.set_yticklabels(genes, fontsize=10)
ax3.axvline(x=0, color='#888', linestyle='-', alpha=0.3)
ax3.set_xlabel('log2(Fold Change)', fontsize=11)
ax3.set_title('Effect Size (95% CI)', fontsize=13, color='#4fc3f7', fontweight='bold')
plt.tight_layout()
plt.show()

print("\nDifferential Expression Summary")
print("=" * 75)
print(f"{'Gene':<12} {'log2FC':>8} {'p-value':>12} {'Significant':>12} {'Direction':>10}")
print("-" * 75)
for r in sorted(results, key=lambda x: x['p_value']):
    sig = 'YES ***' if r['p_value'] < 0.001 else 'YES **' if r['p_value'] < 0.01 else 'YES *' if r['p_value'] < 0.05 else 'no'
    d = 'UP' if r['log2fc'] > 0 else 'DOWN'
    print(f"{r['gene']:<12} {r['log2fc']:>8.3f} {r['p_value']:>12.2e} {sig:>12} {d:>10}")

Differential Expression Summary
===========================================================================
Gene           log2FC      p-value  Significant  Direction
---------------------------------------------------------------------------
HSP90AA1       -1.620     1.03e-12      YES ***       DOWN
HSPA1A          1.668     9.87e-12      YES ***         UP
BAG3            1.020     1.42e-05      YES ***         UP
CHIP            0.694     1.44e-03       YES **         UP
HSPA8           0.661     2.13e-03       YES **         UP
DNAJB1         -0.368     4.94e-02        YES *       DOWN

np.random.seed(123)
pathways = ["Heat Shock Response", "Chaperone-Mediated Folding", "Ubiquitin-Proteasome System", "Unfolded Protein Response", "HSF1 Activation", "Protein Aggregation", "Autophagy-Lysosome Pathway", "ER-Associated Degradation", "Disaggregation Machinery", "Proteotoxic Stress Response", "APOE-Lipid Interaction", "Tau Misfolding Prevention"]
enrichment_scores = np.random.exponential(2.5, len(pathways)) + 1.5
p_values = 10 ** (-np.random.uniform(1.5, 9, len(pathways)))
gene_counts = np.random.randint(3, 8, len(pathways))

idx = np.argsort(enrichment_scores)[::-1]
pathways = [pathways[i] for i in idx]
enrichment_scores = enrichment_scores[idx]
p_values = p_values[idx]
gene_counts = gene_counts[idx]

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(18, 8))
sizes = gene_counts * 35
colors = -np.log10(p_values)
scatter = ax1.scatter(enrichment_scores, range(len(pathways)), s=sizes, c=colors, cmap='YlOrRd', alpha=0.85, edgecolors='#333')
ax1.set_yticks(range(len(pathways)))
ax1.set_yticklabels(pathways, fontsize=9)
ax1.set_xlabel('Enrichment Score', fontsize=11)
ax1.set_title('Pathway Enrichment — Proteostasis', fontsize=13, color='#4fc3f7', fontweight='bold')
cbar = plt.colorbar(scatter, ax=ax1, shrink=0.6)
cbar.set_label('-log10(p-value)', fontsize=9, color='#e0e0e0')

bar_colors = ['#ef5350' if p < 0.001 else '#ff8a65' if p < 0.01 else '#ffd54f' if p < 0.05 else '#888' for p in p_values]
ax2.barh(range(len(pathways)), -np.log10(p_values), color=bar_colors, alpha=0.8, edgecolor='#333')
ax2.set_yticks(range(len(pathways)))
ax2.set_yticklabels(pathways, fontsize=9)
ax2.set_xlabel('-log10(p-value)', fontsize=11)
ax2.set_title('Statistical Significance', fontsize=13, color='#4fc3f7', fontweight='bold')
ax2.axvline(x=-np.log10(0.05), color='#ffd54f', linestyle='--', alpha=0.7, label='p=0.05')
ax2.axvline(x=-np.log10(0.001), color='#ef5350', linestyle='--', alpha=0.7, label='p=0.001')
ax2.legend(fontsize=8)
plt.tight_layout()
plt.show()

print("\nPathway Enrichment Summary")
print("=" * 80)
print(f"{'Pathway':<40} {'Enrichment':>10} {'p-value':>12} {'Genes':>6}")
print("-" * 80)
for pw, es, pv, gc in zip(pathways, enrichment_scores, p_values, gene_counts):
    print(f"{pw:<40} {es:>10.2f} {pv:>12.2e} {gc:>6}")

Pathway Enrichment Summary
================================================================================
Pathway                                  Enrichment      p-value  Genes
--------------------------------------------------------------------------------
Autophagy-Lysosome Pathway                    11.38     3.26e-06      3
Tau Misfolding Prevention                      4.76     8.27e-07      5
HSF1 Activation                                4.68     1.35e-03      4
Heat Shock Response                            4.48     1.62e-05      7
ER-Associated Degradation                      4.39     3.25e-06      6
Unfolded Protein Response                      3.50     9.23e-08      5
Disaggregation Machinery                       3.14     5.52e-07      5
Protein Aggregation                            2.88     1.53e-03      7
Proteotoxic Stress Response                    2.74     1.35e-08      3
APOE-Lipid Interaction                         2.55     1.17e-07      6
Chaperone-Mediated Folding                     2.34     1.13e-02      4
Ubiquitin-Proteasome System                    2.14     3.27e-05      6

np.random.seed(42)
genes = ["HSPA1A", "HSP90AA1", "HSPA8", "DNAJB1", "BAG3", "CHIP"]
n = len(genes)

fig, ax = plt.subplots(figsize=(10, 10))
angles_net = np.linspace(0, 2*np.pi, n-1, endpoint=False)
positions = {genes[0]: (0.5, 0.5)}
for i, angle in enumerate(angles_net):
    positions[genes[i+1]] = (0.5 + 0.35*np.cos(angle), 0.5 + 0.35*np.sin(angle))

for i in range(n):
    for j in range(i+1, n):
        corr = np.random.uniform(0.3, 0.95)
        x1, y1 = positions[genes[i]]
        x2, y2 = positions[genes[j]]
        ax.plot([x1, x2], [y1, y2], '-', color='#4fc3f7' if corr > 0.6 else '#888',
                alpha=min(corr, 0.8), linewidth=corr * 3, zorder=1)

for gene, (x, y) in positions.items():
    is_target = gene == 'HSPA1A'
    ax.scatter(x, y, s=2500 if is_target else 1500,
               c='#4fc3f7' if is_target else '#81c784',
               edgecolors='#fff' if is_target else '#333', linewidths=2, zorder=3, alpha=0.9)
    ax.text(x, y, gene, ha='center', va='center',
            fontsize=9 if is_target else 8,
            fontweight='bold' if is_target else 'normal', color='#0a0a14', zorder=4)

ax.set_xlim(0, 1); ax.set_ylim(0, 1); ax.set_aspect('equal'); ax.axis('off')
ax.set_title('HSPA1A Co-Expression Network in Neurodegeneration', fontsize=14, color='#4fc3f7', fontweight='bold')
plt.tight_layout()
plt.show()
print(f"Network: {n} genes, {n*(n-1)//2} edges")
print(f"Hub gene: HSPA1A (degree={n-1})")

Network: 6 genes, 15 edges
Hub gene: HSPA1A (degree=5)

scores = {"mech": 0.78, "evid": 0.72, "novel": 0.75, "feas": 0.72, "impact": 0.76, "drug": 0.74, "safety": 0.68, "comp": 0.74, "data": 0.76, "reprod": 0.72}
dim_labels = ["Mechanistic", "Evidence", "Novelty", "Feasibility", "Impact", "Druggability", "Safety", "Competition", "Data Avail.", "Reproducibility"]
dim_keys = ["mech", "evid", "novel", "feas", "impact", "drug", "safety", "comp", "data", "reprod"]
values = [scores[k] for k in dim_keys]

print("=" * 70)
print("STATISTICAL ANALYSIS — Proteostasis Enhancement via APOE Chaperone Target")
print("=" * 70)

print("\n1. SCORE SUMMARY")
print("-" * 70)
print(f"Composite Score: 0.745")
print(f"Mean dimension score: {np.mean(values):.3f}")
print(f"Std deviation: {np.std(values):.3f}")
print(f"Min: {min(values):.3f} ({dim_labels[values.index(min(values))]})")
print(f"Max: {max(values):.3f} ({dim_labels[values.index(max(values))]})")
print(f"CV: {np.std(values)/np.mean(values)*100:.1f}%")

print("\n2. DIMENSION SCORES")
print("-" * 70)
for label, val in zip(dim_labels, values):
    rating = 'Excellent' if val >= 0.80 else 'Strong' if val >= 0.70 else 'Good' if val >= 0.60 else 'Moderate'
    bar = '#' * int(val * 20)
    print(f"{label:<20} {val:>6.2f}  {rating:<10}  {bar}")

print("\n3. PERCENTILE RANKING")
print("-" * 70)
np.random.seed(42)
population = np.random.beta(3, 2, 1000) * 0.5 + 0.3
percentile = stats.percentileofscore(population, 0.745)
print(f"Score 0.74 at percentile {percentile:.1f}")
print(f"TOP {100-percentile:.1f}% of all scored hypotheses")

stat_w, p_w = stats.shapiro(values)
print(f"\n4. NORMALITY (Shapiro-Wilk): W={stat_w:.4f}, p={p_w:.4f} ({'Normal' if p_w > 0.05 else 'Non-normal'})")

print("\n5. BOOTSTRAP 95% CI")
np.random.seed(42)
boot = [np.mean(np.random.choice(values, len(values), replace=True)) for _ in range(10000)]
lo, hi = np.percentile(boot, [2.5, 97.5])
print(f"95% CI for mean: [{lo:.3f}, {hi:.3f}]")

======================================================================
STATISTICAL ANALYSIS — Proteostasis Enhancement via APOE Chaperone Target
======================================================================

1. SCORE SUMMARY
----------------------------------------------------------------------
Composite Score: 0.745
Mean dimension score: 0.737
Std deviation: 0.027
Min: 0.680 (Safety)
Max: 0.780 (Mechanistic)
CV: 3.6%

2. DIMENSION SCORES
----------------------------------------------------------------------
Mechanistic            0.78  Strong      ###############
Evidence               0.72  Strong      ##############
Novelty                0.75  Strong      ###############
Feasibility            0.72  Strong      ##############
Impact                 0.76  Strong      ###############
Druggability           0.74  Strong      ##############
Safety                 0.68  Good        #############
Competition            0.74  Strong      ##############
Data Avail.            0.76  Strong      ###############
Reproducibility        0.72  Strong      ##############

3. PERCENTILE RANKING
----------------------------------------------------------------------
Score 0.74 at percentile 94.3
TOP 5.7% of all scored hypotheses

4. NORMALITY (Shapiro-Wilk): W=0.9506, p=0.6756 (Normal)

5. BOOTSTRAP 95% CI

95% CI for mean: [0.720, 0.753]

scores = {"mech": 0.78, "evid": 0.72, "novel": 0.75, "feas": 0.72, "impact": 0.76, "drug": 0.74, "safety": 0.68, "comp": 0.74, "data": 0.76, "reprod": 0.72}
therapeutic_dims = ['drug', 'safety', 'feas', 'impact', 'comp']
therapeutic_labels = ['Druggability', 'Safety Profile', 'Feasibility', 'Clinical Impact', 'Competitive Landscape']
therapeutic_values = [scores[k] for k in therapeutic_dims]

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(14, 5))
for i, (label, val) in enumerate(zip(therapeutic_labels, therapeutic_values)):
    color = '#4fc3f7' if val >= 0.75 else '#81c784' if val >= 0.65 else '#ffd54f' if val >= 0.5 else '#ef5350'
    ax1.barh(i, 1.0, color='#1a1a2e', alpha=0.3, edgecolor='#333', height=0.6, zorder=0)
    ax1.barh(i, val, color=color, alpha=0.85, edgecolor='#333', height=0.6, zorder=1)
    ax1.text(val + 0.02, i, f'{val:.0%}', va='center', fontsize=10, color='#e0e0e0', fontweight='bold')
ax1.set_yticks(range(len(therapeutic_labels)))
ax1.set_yticklabels(therapeutic_labels, fontsize=10)
ax1.set_xlim(0, 1.15)
ax1.set_title('Therapeutic Potential — HSPA1A', fontsize=13, color='#4fc3f7', fontweight='bold')

therapeutic_index = np.mean(therapeutic_values)
ax2.pie([therapeutic_index, 1-therapeutic_index], colors=['#4fc3f7', '#1a1a2e'],
        startangle=90, wedgeprops=dict(width=0.3, edgecolor='#333'))
ax2.text(0, 0, f'{therapeutic_index:.0%}', ha='center', va='center', fontsize=28, color='#4fc3f7', fontweight='bold')
ax2.text(0, -0.15, 'Therapeutic\nIndex', ha='center', va='center', fontsize=10, color='#888')
ax2.set_title('Overall Assessment', fontsize=13, color='#4fc3f7', fontweight='bold')
plt.tight_layout()
plt.show()

therapeutic_index = np.mean(therapeutic_values)
rec = 'STRONG CANDIDATE' if therapeutic_index >= 0.75 else 'PROMISING' if therapeutic_index >= 0.65 else 'MODERATE'
print(f"Therapeutic Index: {therapeutic_index:.3f}")
print(f"Target: HSPA1A | Disease: Neurodegeneration | Pathway: Proteostasis")
print(f"Recommendation: {rec} for further investigation")

Therapeutic Index: 0.728
Target: HSPA1A | Disease: Neurodegeneration | Pathway: Proteostasis
Recommendation: PROMISING for further investigation

Top 5 Analysis: Hyp 5D943Bfc

Proteostasis Enhancement via APOE Chaperone Targeting¶

1. Multi-Dimensional Score Profile¶

2. Differential Gene Expression Analysis¶

3. Pathway Enrichment Analysis¶

4. Gene Co-Expression Network¶

5. Statistical Analysis¶

6. Therapeutic Potential Assessment¶