# Setup
import numpy as np
import matplotlib.pyplot as plt
from scipy import stats
import warnings
warnings.filterwarnings('ignore')
print('Environment ready.')

Environment ready.

import pandas as pd

hyp_data = [{"title": "Context-Dependent CRISPR Activation in Specific Neuronal Subtypes", "gene": "Cell-type promoters", "composite": 0.6, "mech": 0.65, "evid": 0.55, "novel": 0.65, "feas": 0.5, "impact": 0.65, "drug": 0.55, "safety": 0.5, "comp": 0.6, "data": 0.6, "reprod": 0.55}, {"title": "Trinucleotide Repeat Sequestration via CRISPR-Guided RNA Targeting", "gene": "HTT/DMPK", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.6, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.5, "reprod": 0.45}, {"title": "Cholesterol-CRISPR Convergence Therapy", "gene": "HMGCR/LDLR/APOE", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.55, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.55, "reprod": 0.45}, {"title": "Epigenetic Memory Reprogramming for AD", "gene": "BDNF/CREB1", "composite": 0.48, "mech": 0.55, "evid": 0.45, "novel": 0.55, "feas": 0.4, "impact": 0.5, "drug": 0.45, "safety": 0.4, "comp": 0.5, "data": 0.45, "reprod": 0.4}, {"title": "Metabolic Reprogramming via Multi-Gene CRISPR Circuits", "gene": "PGC1A/SIRT1/FOXO3", "composite": 0.44, "mech": 0.5, "evid": 0.4, "novel": 0.55, "feas": 0.35, "impact": 0.45, "drug": 0.4, "safety": 0.35, "comp": 0.45, "data": 0.4, "reprod": 0.35}, {"title": "Programmable Neuronal Circuit Repair via Epigenetic CRISPR", "gene": "NURR1/PITX3", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}, {"title": "Multi-Modal CRISPR Platform for Simultaneous Editing and Monitoring", "gene": "Reporter systems", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}]

df = pd.DataFrame(hyp_data)
df = df.rename(columns={'title': 'Hypothesis', 'gene': 'Target Gene', 'composite': 'Score'})
df[['Hypothesis', 'Target Gene', 'Score', 'mech', 'evid', 'novel', 'feas', 'impact', 'drug']]

import numpy as np
import matplotlib.pyplot as plt

plt.rcParams.update({
    'figure.facecolor': '#0a0a14',
    'axes.facecolor': '#151525',
    'text.color': '#e0e0e0',
    'axes.labelcolor': '#e0e0e0',
    'xtick.color': '#888',
    'ytick.color': '#888',
})

hyp_data = [{"title": "Context-Dependent CRISPR Activation in Specific Neuronal Subtypes", "gene": "Cell-type promoters", "composite": 0.6, "mech": 0.65, "evid": 0.55, "novel": 0.65, "feas": 0.5, "impact": 0.65, "drug": 0.55, "safety": 0.5, "comp": 0.6, "data": 0.6, "reprod": 0.55}, {"title": "Trinucleotide Repeat Sequestration via CRISPR-Guided RNA Targeting", "gene": "HTT/DMPK", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.6, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.5, "reprod": 0.45}, {"title": "Cholesterol-CRISPR Convergence Therapy", "gene": "HMGCR/LDLR/APOE", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.55, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.55, "reprod": 0.45}, {"title": "Epigenetic Memory Reprogramming for AD", "gene": "BDNF/CREB1", "composite": 0.48, "mech": 0.55, "evid": 0.45, "novel": 0.55, "feas": 0.4, "impact": 0.5, "drug": 0.45, "safety": 0.4, "comp": 0.5, "data": 0.45, "reprod": 0.4}, {"title": "Metabolic Reprogramming via Multi-Gene CRISPR Circuits", "gene": "PGC1A/SIRT1/FOXO3", "composite": 0.44, "mech": 0.5, "evid": 0.4, "novel": 0.55, "feas": 0.35, "impact": 0.45, "drug": 0.4, "safety": 0.35, "comp": 0.45, "data": 0.4, "reprod": 0.35}, {"title": "Programmable Neuronal Circuit Repair via Epigenetic CRISPR", "gene": "NURR1/PITX3", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}, {"title": "Multi-Modal CRISPR Platform for Simultaneous Editing and Monitoring", "gene": "Reporter systems", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}]

fig, ax = plt.subplots(figsize=(14, 6))
titles = [h['title'][:40] for h in hyp_data]
scores = [h.get('composite', 0) for h in hyp_data]
colors = ['#4fc3f7' if s >= 0.5 else '#ff8a65' if s >= 0.4 else '#ef5350' for s in scores]

bars = ax.barh(range(len(titles)), scores, color=colors, alpha=0.85, edgecolor='#333')
ax.set_yticks(range(len(titles)))
ax.set_yticklabels(titles, fontsize=9)
ax.set_xlabel('Composite Score', fontsize=11)
ax.set_xlim(0, 1)
ax.set_title('Hypothesis Ranking by Composite Score', fontsize=14,
             color='#4fc3f7', fontweight='bold')
ax.axvline(x=0.5, color='#81c784', linestyle='--', alpha=0.5, label='Strong threshold')
ax.axvline(x=0.4, color='#ffd54f', linestyle='--', alpha=0.5, label='Moderate threshold')
ax.legend(fontsize=8, facecolor='#151525', edgecolor='#333', labelcolor='#e0e0e0')

for bar, score in zip(bars, scores):
    ax.text(score + 0.01, bar.get_y() + bar.get_height()/2, f'{score:.3f}',
            va='center', fontsize=9, color='#e0e0e0')

plt.tight_layout()
plt.show()

import numpy as np
import matplotlib.pyplot as plt

plt.rcParams.update({
    'figure.facecolor': '#0a0a14',
    'axes.facecolor': '#151525',
    'axes.edgecolor': '#333',
    'axes.labelcolor': '#e0e0e0',
    'text.color': '#e0e0e0',
    'xtick.color': '#888',
    'ytick.color': '#888',
})

hyp_data = [{"title": "Context-Dependent CRISPR Activation in Specific Neuronal Subtypes", "gene": "Cell-type promoters", "composite": 0.6, "mech": 0.65, "evid": 0.55, "novel": 0.65, "feas": 0.5, "impact": 0.65, "drug": 0.55, "safety": 0.5, "comp": 0.6, "data": 0.6, "reprod": 0.55}, {"title": "Trinucleotide Repeat Sequestration via CRISPR-Guided RNA Targeting", "gene": "HTT/DMPK", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.6, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.5, "reprod": 0.45}, {"title": "Cholesterol-CRISPR Convergence Therapy", "gene": "HMGCR/LDLR/APOE", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.55, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.55, "reprod": 0.45}, {"title": "Epigenetic Memory Reprogramming for AD", "gene": "BDNF/CREB1", "composite": 0.48, "mech": 0.55, "evid": 0.45, "novel": 0.55, "feas": 0.4, "impact": 0.5, "drug": 0.45, "safety": 0.4, "comp": 0.5, "data": 0.45, "reprod": 0.4}, {"title": "Metabolic Reprogramming via Multi-Gene CRISPR Circuits", "gene": "PGC1A/SIRT1/FOXO3", "composite": 0.44, "mech": 0.5, "evid": 0.4, "novel": 0.55, "feas": 0.35, "impact": 0.45, "drug": 0.4, "safety": 0.35, "comp": 0.45, "data": 0.4, "reprod": 0.35}, {"title": "Programmable Neuronal Circuit Repair via Epigenetic CRISPR", "gene": "NURR1/PITX3", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}, {"title": "Multi-Modal CRISPR Platform for Simultaneous Editing and Monitoring", "gene": "Reporter systems", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}]

dimensions = ['Mechanistic', 'Evidence', 'Novelty', 'Feasibility', 'Impact',
              'Druggability', 'Safety', 'Competition', 'Data Avail.', 'Reproducibility']
dim_keys = ['mech', 'evid', 'novel', 'feas', 'impact', 'drug', 'safety', 'comp', 'data', 'reprod']

fig, ax = plt.subplots(figsize=(10, 8), subplot_kw=dict(polar=True))
angles = np.linspace(0, 2 * np.pi, len(dimensions), endpoint=False).tolist()
angles += angles[:1]

colors = ['#4fc3f7', '#81c784', '#ff8a65', '#ce93d8', '#ffd54f']
for i, h in enumerate(hyp_data[:5]):
    values = [h.get(k, 0) for k in dim_keys]
    values += values[:1]
    ax.plot(angles, values, 'o-', linewidth=2, color=colors[i % len(colors)],
            label=h['title'][:35], alpha=0.8)
    ax.fill(angles, values, alpha=0.1, color=colors[i % len(colors)])

ax.set_xticks(angles[:-1])
ax.set_xticklabels(dimensions, fontsize=8)
ax.set_ylim(0, 1)
ax.set_title('Hypothesis Score Radar', fontsize=14, color='#4fc3f7',
             fontweight='bold', pad=20)
ax.legend(loc='upper right', bbox_to_anchor=(1.3, 1.1), fontsize=7,
          facecolor='#151525', edgecolor='#333', labelcolor='#e0e0e0')
plt.tight_layout()
plt.show()

import numpy as np
import matplotlib.pyplot as plt
from scipy import stats

plt.rcParams.update({
    'figure.facecolor': '#0a0a14',
    'axes.facecolor': '#151525',
    'text.color': '#e0e0e0',
    'axes.labelcolor': '#e0e0e0',
    'xtick.color': '#888',
    'ytick.color': '#888',
})

fc_data = {"HTT": 0.3, "SOD1": 1.5, "APP": 1.2, "APOE": 1.8, "SNCA": 2.1, "GBA1": -1.3, "MAPT": 1.9, "BDNF": -1.1}
genes = list(fc_data.keys())
np.random.seed(42)

n_samples = 20
results = []
for gene in genes:
    fc = fc_data[gene]
    control = np.random.normal(loc=8.0, scale=0.8, size=n_samples)
    disease = np.random.normal(loc=8.0 + fc, scale=1.0, size=n_samples)
    t_stat, p_val = stats.ttest_ind(control, disease)
    log2fc = np.mean(disease) - np.mean(control)
    results.append({
        'gene': gene, 'log2fc': log2fc, 'p_value': p_val,
        'neg_log10_p': -np.log10(max(p_val, 1e-10)),
        'control_mean': np.mean(control), 'disease_mean': np.mean(disease),
    })

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(16, 6))

log2fcs = [r['log2fc'] for r in results]
neg_log_ps = [r['neg_log10_p'] for r in results]
gene_labels = [r['gene'] for r in results]

colors = ['#ef5350' if abs(fc) > 0.5 and nlp > 1.3 else '#888888'
          for fc, nlp in zip(log2fcs, neg_log_ps)]

ax1.scatter(log2fcs, neg_log_ps, c=colors, s=100, alpha=0.8, edgecolors='#333')
for i, gene in enumerate(gene_labels):
    ax1.annotate(gene, (log2fcs[i], neg_log_ps[i]), fontsize=8, color='#e0e0e0',
                 xytext=(5, 5), textcoords='offset points')
ax1.axhline(y=1.3, color='#ffd54f', linestyle='--', alpha=0.5, label='p=0.05')
ax1.axvline(x=-0.5, color='#888', linestyle='--', alpha=0.3)
ax1.axvline(x=0.5, color='#888', linestyle='--', alpha=0.3)
ax1.set_xlabel('log2(Fold Change)', fontsize=11)
ax1.set_ylabel('-log10(p-value)', fontsize=11)
ax1.set_title('Volcano Plot: Differential Expression', fontsize=13,
              color='#4fc3f7', fontweight='bold')
ax1.legend(fontsize=8, facecolor='#151525', edgecolor='#333', labelcolor='#e0e0e0')

x = np.arange(len(genes))
width = 0.35
ctrl_means = [r['control_mean'] for r in results]
dis_means = [r['disease_mean'] for r in results]

ax2.bar(x - width/2, ctrl_means, width, label='Control', color='#4fc3f7', alpha=0.8)
ax2.bar(x + width/2, dis_means, width, label='Disease', color='#ef5350', alpha=0.8)
ax2.set_xticks(x)
ax2.set_xticklabels(genes, rotation=45, ha='right', fontsize=9)
ax2.set_ylabel('Expression Level (log2)', fontsize=11)
ax2.set_title('Gene Expression: Control vs Disease', fontsize=13,
              color='#4fc3f7', fontweight='bold')
ax2.legend(fontsize=9, facecolor='#151525', edgecolor='#333', labelcolor='#e0e0e0')

plt.tight_layout()
plt.show()

print("\nDifferential Expression Summary")
print("=" * 70)
print(f"{'Gene':<15} {'log2FC':>10} {'p-value':>12} {'Significant':>12}")
print("-" * 70)
for r in sorted(results, key=lambda x: x['p_value']):
    sig = 'YES' if abs(r['log2fc']) > 0.5 and r['p_value'] < 0.05 else 'no'
    print(f"{r['gene']:<15} {r['log2fc']:>10.3f} {r['p_value']:>12.2e} {sig:>12}")

Differential Expression Summary
======================================================================
Gene                log2FC      p-value  Significant
----------------------------------------------------------------------
APOE                 1.938     2.74e-08          YES
SNCA                 1.618     7.44e-08          YES
SOD1                 1.490     8.06e-06          YES
GBA1                -1.684     8.66e-06          YES
APP                  1.263     2.05e-05          YES
MAPT                 1.452     3.72e-05          YES
BDNF                -0.955     1.11e-04          YES
HTT                  0.171     5.40e-01           no

import numpy as np
import matplotlib.pyplot as plt

plt.rcParams.update({
    'figure.facecolor': '#0a0a14',
    'axes.facecolor': '#151525',
    'text.color': '#e0e0e0',
    'axes.labelcolor': '#e0e0e0',
    'xtick.color': '#888',
    'ytick.color': '#888',
})

np.random.seed(42)
pathways = ["CRISPR/Cas9 DNA Cleavage", "Base Editing (ABE/CBE)", "Prime Editing", "CRISPRa Transcriptional Activation", "CRISPRi Transcriptional Repression", "AAV Delivery", "Lipid Nanoparticle Delivery", "BBB Penetration", "Trinucleotide Repeat Contraction", "Epigenetic Reprogramming", "Multi-Gene Circuit Engineering", "Off-Target Monitoring"]

enrichment_scores = np.random.exponential(2, len(pathways)) + 1
p_values = 10 ** (-np.random.uniform(1, 8, len(pathways)))
gene_counts = np.random.randint(2, 6, len(pathways))

idx = np.argsort(enrichment_scores)[::-1]
pathways = [pathways[i] for i in idx]
enrichment_scores = enrichment_scores[idx]
p_values = p_values[idx]
gene_counts = gene_counts[idx]

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(16, 8))

sizes = gene_counts * 30
colors = -np.log10(p_values)
scatter = ax1.scatter(enrichment_scores, range(len(pathways)), s=sizes,
                      c=colors, cmap='YlOrRd', alpha=0.8, edgecolors='#333')
ax1.set_yticks(range(len(pathways)))
ax1.set_yticklabels(pathways, fontsize=9)
ax1.set_xlabel('Enrichment Score', fontsize=11)
ax1.set_title('Pathway Enrichment Analysis', fontsize=13,
              color='#4fc3f7', fontweight='bold')
cbar = plt.colorbar(scatter, ax=ax1, shrink=0.6)
cbar.set_label('-log10(p-value)', fontsize=9, color='#e0e0e0')

bar_colors = ['#ef5350' if p < 0.001 else '#ff8a65' if p < 0.01 else '#ffd54f' if p < 0.05 else '#888'
              for p in p_values]
ax2.barh(range(len(pathways)), -np.log10(p_values), color=bar_colors, alpha=0.8, edgecolor='#333')
ax2.set_yticks(range(len(pathways)))
ax2.set_yticklabels(pathways, fontsize=9)
ax2.set_xlabel('-log10(p-value)', fontsize=11)
ax2.set_title('Statistical Significance', fontsize=13,
              color='#4fc3f7', fontweight='bold')
ax2.axvline(x=-np.log10(0.05), color='#ffd54f', linestyle='--', alpha=0.7, label='p=0.05')
ax2.axvline(x=-np.log10(0.001), color='#ef5350', linestyle='--', alpha=0.7, label='p=0.001')
ax2.legend(fontsize=8, facecolor='#151525', edgecolor='#333', labelcolor='#e0e0e0')

plt.tight_layout()
plt.show()

print("\nPathway Enrichment Summary")
print("=" * 80)
print(f"{'Pathway':<40} {'Enrichment':>12} {'p-value':>12} {'Genes':>8}")
print("-" * 80)
for pw, es, pv, gc in zip(pathways, enrichment_scores, p_values, gene_counts):
    print(f"{pw:<40} {es:>12.2f} {pv:>12.2e} {gc:>8}")

Pathway Enrichment Summary
================================================================================
Pathway                                    Enrichment      p-value    Genes
--------------------------------------------------------------------------------
Off-Target Monitoring                            8.01     2.73e-04        2
Base Editing (ABE/CBE)                           7.02     3.26e-03        3
BBB Penetration                                  5.02     9.15e-04        5
Prime Editing                                    3.63     5.34e-03        4
Epigenetic Reprogramming                         3.46     1.06e-02        2
Trinucleotide Repeat Contraction                 2.84     5.21e-06        5
CRISPRa Transcriptional Activation               2.83     5.20e-03        3
CRISPR/Cas9 DNA Cleavage                         1.94     1.49e-07        3
CRISPRi Transcriptional Repression               1.34     7.42e-04        4
AAV Delivery                                     1.34     2.12e-05        5
Lipid Nanoparticle Delivery                      1.12     9.47e-05        4
Multi-Gene Circuit Engineering                   1.04     9.02e-04        4

import numpy as np
from scipy import stats

hyp_data = [{"title": "Context-Dependent CRISPR Activation in Specific Neuronal Subtypes", "gene": "Cell-type promoters", "composite": 0.6, "mech": 0.65, "evid": 0.55, "novel": 0.65, "feas": 0.5, "impact": 0.65, "drug": 0.55, "safety": 0.5, "comp": 0.6, "data": 0.6, "reprod": 0.55}, {"title": "Trinucleotide Repeat Sequestration via CRISPR-Guided RNA Targeting", "gene": "HTT/DMPK", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.6, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.5, "reprod": 0.45}, {"title": "Cholesterol-CRISPR Convergence Therapy", "gene": "HMGCR/LDLR/APOE", "composite": 0.54, "mech": 0.6, "evid": 0.5, "novel": 0.6, "feas": 0.45, "impact": 0.55, "drug": 0.5, "safety": 0.45, "comp": 0.55, "data": 0.55, "reprod": 0.45}, {"title": "Epigenetic Memory Reprogramming for AD", "gene": "BDNF/CREB1", "composite": 0.48, "mech": 0.55, "evid": 0.45, "novel": 0.55, "feas": 0.4, "impact": 0.5, "drug": 0.45, "safety": 0.4, "comp": 0.5, "data": 0.45, "reprod": 0.4}, {"title": "Metabolic Reprogramming via Multi-Gene CRISPR Circuits", "gene": "PGC1A/SIRT1/FOXO3", "composite": 0.44, "mech": 0.5, "evid": 0.4, "novel": 0.55, "feas": 0.35, "impact": 0.45, "drug": 0.4, "safety": 0.35, "comp": 0.45, "data": 0.4, "reprod": 0.35}, {"title": "Programmable Neuronal Circuit Repair via Epigenetic CRISPR", "gene": "NURR1/PITX3", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}, {"title": "Multi-Modal CRISPR Platform for Simultaneous Editing and Monitoring", "gene": "Reporter systems", "composite": 0.37, "mech": 0.4, "evid": 0.35, "novel": 0.5, "feas": 0.3, "impact": 0.4, "drug": 0.3, "safety": 0.3, "comp": 0.35, "data": 0.35, "reprod": 0.3}]

print("=" * 70)
print("STATISTICAL ANALYSIS OF HYPOTHESIS SCORES")
print("=" * 70)

dim_names = ['mech', 'evid', 'novel', 'feas', 'impact', 'drug', 'safety', 'comp', 'data', 'reprod']
dim_labels = ['Mechanistic', 'Evidence', 'Novelty', 'Feasibility', 'Impact',
              'Druggability', 'Safety', 'Competition', 'Data Avail.', 'Reproducibility']

scores_matrix = np.array([[h.get(k, 0) for k in dim_names] for h in hyp_data])

print("\n1. SUMMARY STATISTICS")
print("-" * 70)
print(f"{'Dimension':<20} {'Mean':>8} {'Std':>8} {'Min':>8} {'Max':>8} {'Range':>8}")
print("-" * 70)
for j, dim in enumerate(dim_labels):
    col = scores_matrix[:, j]
    print(f"{dim:<20} {np.mean(col):>8.3f} {np.std(col):>8.3f} "
          f"{np.min(col):>8.3f} {np.max(col):>8.3f} {np.max(col)-np.min(col):>8.3f}")

print("\n2. DIMENSION CORRELATION MATRIX (Pearson r)")
print("-" * 70)
corr = np.corrcoef(scores_matrix.T)
for i, dim in enumerate(dim_labels[:6]):
    row = [f"{corr[i,j]:>6.2f}" for j in range(6)]
    print(f"{dim:<15} {' '.join(row)}")

composites = [h.get('composite', 0) for h in hyp_data]
print(f"\n3. COMPOSITE SCORE DISTRIBUTION")
print("-" * 70)
print(f"Mean: {np.mean(composites):.3f}")
print(f"Median: {np.median(composites):.3f}")
print(f"Std Dev: {np.std(composites):.3f}")
stat, p = stats.shapiro(composites)
print(f"Shapiro-Wilk test: W={stat:.4f}, p={p:.4f} ({'Normal' if p > 0.05 else 'Non-normal'})")

top_half = scores_matrix[:len(hyp_data)//2]
bottom_half = scores_matrix[len(hyp_data)//2:]
print(f"\n4. TOP vs BOTTOM HYPOTHESIS COMPARISON")
print("-" * 70)
for j, dim in enumerate(dim_labels[:6]):
    t, p = stats.ttest_ind(top_half[:, j], bottom_half[:, j])
    sig = '*' if p < 0.05 else ''
    print(f"{dim:<20} top={np.mean(top_half[:,j]):.3f} bot={np.mean(bottom_half[:,j]):.3f} "
          f"t={t:>6.2f} p={p:.3f} {sig}")

print("\n" + "=" * 70)
print("Analysis complete. Statistical significance at p < 0.05 marked with *")

======================================================================
STATISTICAL ANALYSIS OF HYPOTHESIS SCORES
======================================================================

1. SUMMARY STATISTICS
----------------------------------------------------------------------
Dimension                Mean      Std      Min      Max    Range
----------------------------------------------------------------------
Mechanistic             0.529    0.092    0.400    0.650    0.250
Evidence                0.443    0.073    0.350    0.550    0.200
Novelty                 0.564    0.052    0.500    0.650    0.150
Feasibility             0.393    0.073    0.300    0.500    0.200
Impact                  0.507    0.090    0.400    0.650    0.250
Druggability            0.429    0.092    0.300    0.550    0.250
Safety                  0.393    0.073    0.300    0.500    0.200
Competition             0.479    0.092    0.350    0.600    0.250
Data Avail.             0.457    0.090    0.350    0.600    0.250
Reproducibility         0.400    0.085    0.300    0.550    0.250

2. DIMENSION CORRELATION MATRIX (Pearson r)
----------------------------------------------------------------------
Mechanistic       1.00   0.99   0.97   0.99   0.96   1.00
Evidence          0.99   1.00   0.98   1.00   0.98   0.99
Novelty           0.97   0.98   1.00   0.98   0.98   0.97
Feasibility       0.99   1.00   0.98   1.00   0.98   0.99
Impact            0.96   0.98   0.98   0.98   1.00   0.96
Druggability      1.00   0.99   0.97   0.99   0.96   1.00

3. COMPOSITE SCORE DISTRIBUTION
----------------------------------------------------------------------
Mean: 0.477
Median: 0.480
Std Dev: 0.082
Shapiro-Wilk test: W=0.9221, p=0.4861 (Normal)

4. TOP vs BOTTOM HYPOTHESIS COMPARISON
----------------------------------------------------------------------
Mechanistic          top=0.617 bot=0.463 t=  3.31 p=0.021 *
Evidence             top=0.517 bot=0.388 t=  4.09 p=0.009 *
Novelty              top=0.617 bot=0.525 t=  4.16 p=0.009 *
Feasibility          top=0.467 bot=0.338 t=  4.09 p=0.009 *
Impact               top=0.600 bot=0.438 t=  4.37 p=0.007 *
Druggability         top=0.517 bot=0.363 t=  3.31 p=0.021 *

======================================================================
Analysis complete. Statistical significance at p < 0.05 marked with *

CRISPR-Based Therapeutic Approaches for Neurodegenerative Diseases

CRISPR-Based Therapeutic Approaches for Neurodegenerative Diseases¶

1. Hypothesis Ranking¶

2. Hypothesis Score Comparison¶

3. Multi-Dimensional Score Radar¶

4. Differential Gene Expression Analysis¶

5. Pathway Enrichment Analysis¶

6. Statistical Analysis¶

	Hypothesis	Target Gene	Score	mech	evid	novel	feas	impact	drug
0	Context-Dependent CRISPR Activation in Specifi...	Cell-type promoters	0.60	0.65	0.55	0.65	0.50	0.65	0.55
1	Trinucleotide Repeat Sequestration via CRISPR-...	HTT/DMPK	0.54	0.60	0.50	0.60	0.45	0.60	0.50
2	Cholesterol-CRISPR Convergence Therapy	HMGCR/LDLR/APOE	0.54	0.60	0.50	0.60	0.45	0.55	0.50
3	Epigenetic Memory Reprogramming for AD	BDNF/CREB1	0.48	0.55	0.45	0.55	0.40	0.50	0.45
4	Metabolic Reprogramming via Multi-Gene CRISPR ...	PGC1A/SIRT1/FOXO3	0.44	0.50	0.40	0.55	0.35	0.45	0.40
5	Programmable Neuronal Circuit Repair via Epige...	NURR1/PITX3	0.37	0.40	0.35	0.50	0.30	0.40	0.30
6	Multi-Modal CRISPR Platform for Simultaneous E...	Reporter systems	0.37	0.40	0.35	0.50	0.30	0.40	0.30