import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from pathlib import Path

# Notebook-wide plotting defaults (individual figures below pass their own figsize)
sns.set_style("whitegrid")
plt.rcParams.update({'figure.figsize': (14, 8)})

# Directories holding the 10-year time-horizon results, without and with washout
time_horizons_dir = Path('/Users/sarahurbut/aladynoulli2/pyScripts/dec_6_revision/new_notebooks/results/time_horizons/pooled_retrospective')
washout_time_horizons_dir = Path('/Users/sarahurbut/aladynoulli2/pyScripts/dec_6_revision/new_notebooks/results/washout_time_horizons/pooled_retrospective')

# Baseline = no washout; washout = 1-year exclusion
baseline_10yr = pd.read_csv(time_horizons_dir / 'static_10yr_results.csv')
washout_10yr = pd.read_csv(washout_time_horizons_dir / 'washout_1yr_10yr_static_results.csv')

# Pair the per-disease AUCs from both runs (default inner join on Disease),
# then rank diseases by how much AUC is lost once the washout is applied.
comparison = pd.merge(
    baseline_10yr[['Disease', 'AUC']],
    washout_10yr[['Disease', 'AUC']],
    on='Disease',
    suffixes=('_baseline', '_washout'),
)
comparison = comparison.assign(
    AUC_drop=comparison['AUC_baseline'] - comparison['AUC_washout']
).sort_values('AUC_drop', ascending=False)

# Text summary: banner, central tendency of the drop, and the ten largest drops
auc_drop = comparison['AUC_drop']
for line in (
    "="*80,
    "APPROACH 1: TIME HORIZON ANALYSIS (10-Year Predictions)",
    "="*80,
    f"\nMean AUC drop: {auc_drop.mean():.4f}",
    f"Median AUC drop: {auc_drop.median():.4f}",
    "\nTop 10 diseases by AUC drop:",
    comparison.head(10).to_string(index=False),
):
    print(line)

# Scatter of baseline vs. washout AUC; points below the dashed diagonal lost AUC
fig, ax = plt.subplots(figsize=(12, 8))
ax.scatter(x=comparison['AUC_baseline'], y=comparison['AUC_washout'], alpha=0.6)
ax.plot([0, 1], [0, 1], 'r--', label='No change')
ax.set_title('Time Horizon Analysis: 10-Year Predictions with 1-Year Exclusion', fontsize=14)
ax.set_xlabel('AUC (10-year, no washout)', fontsize=12)
ax.set_ylabel('AUC (10-year, 1-year exclusion)', fontsize=12)
ax.grid(True, alpha=0.3)
ax.legend()
plt.tight_layout()
plt.show()

print(
    "\n💡 Key Insight: Minimal impact (<2-3% AUC drop) suggests diagnostic cascades\n"
    "   are not a major driver of long-term predictions."
)

================================================================================
APPROACH 1: TIME HORIZON ANALYSIS (10-Year Predictions)
================================================================================

Mean AUC drop: 0.0084
Median AUC drop: 0.0060

Top 10 diseases by AUC drop:
           Disease  AUC_baseline  AUC_washout  AUC_drop
    Crohns_Disease      0.580017     0.547517  0.032499
Multiple_Sclerosis      0.530927     0.501277  0.029650
Ulcerative_Colitis      0.582669     0.562436  0.020234
     Breast_Cancer      0.550715     0.531814  0.018901
  Bipolar_Disorder      0.481331     0.463538  0.017793
            Asthma      0.525205     0.509968  0.015236
   Prostate_Cancer      0.682770     0.672125  0.010645
             ASCVD      0.732897     0.722593  0.010304
 Colorectal_Cancer      0.645633     0.635438  0.010195
          Diabetes      0.630205     0.620962  0.009243

💡 Key Insight: Minimal impact (<2-3% AUC drop) suggests diagnostic cascades
   are not a major driver of long-term predictions.

# Per-disease AUCs of the enrollment-trained model at each washout offset
enrollment_results_file = Path('/Users/sarahurbut/aladynoulli2/pyScripts/dec_6_revision/new_notebooks/results/washout/pooled_retrospective/washout_comparison_all_offsets.csv')

if not enrollment_results_file.exists():
    print(f"⚠️  Enrollment results file not found: {enrollment_results_file}")
else:
    enrollment_df = pd.read_csv(enrollment_results_file)
    # The CSV's leading column carries the disease names but has no header,
    # so relabel it and leave every other column name as read.
    enrollment_df.columns = ['Disease', *enrollment_df.columns[1:]]

    print("="*80)
    print("APPROACH 2: FLOATING PREDICTION (Enrollment-Trained)")
    print("="*80)
    print(f"\n{len(enrollment_df)} diseases analyzed")

    # Both offset columns are needed to compute the 0yr -> 1yr drop
    required_columns = {'0yr_AUC', '1yr_AUC'}
    if not required_columns.issubset(enrollment_df.columns):
        print("⚠️  Expected columns not found in enrollment results file")
        print(f"Available columns: {enrollment_df.columns.tolist()}")
    else:
        # Rank diseases by the AUC lost when moving from a 0-year to a 1-year offset
        comparison = (
            enrollment_df[['Disease', '0yr_AUC', '1yr_AUC']]
            .assign(AUC_drop=lambda frame: frame['0yr_AUC'] - frame['1yr_AUC'])
            .sort_values('AUC_drop', ascending=False)
        )
        auc_drop = comparison['AUC_drop']

        print(f"\nMean AUC drop (0yr → 1yr): {auc_drop.mean():.4f}")
        print(f"Median AUC drop: {auc_drop.median():.4f}")
        print("\nTop 10 diseases by AUC drop:")
        top_ten = comparison.head(10)
        print(top_ten[['Disease', '0yr_AUC', '1yr_AUC', 'AUC_drop']].to_string(index=False))

        # Scatter of 0yr vs. 1yr AUC; points below the dashed diagonal lost AUC
        fig, ax = plt.subplots(figsize=(12, 8))
        ax.scatter(x=comparison['0yr_AUC'], y=comparison['1yr_AUC'], alpha=0.6)
        ax.plot([0, 1], [0, 1], 'r--', label='No change')
        ax.set_title('Floating Prediction: Enrollment-Trained Model at Different Offsets', fontsize=14)
        ax.set_xlabel('AUC (0yr offset)', fontsize=12)
        ax.set_ylabel('AUC (1yr offset)', fontsize=12)
        ax.grid(True, alpha=0.3)
        ax.legend()
        plt.tight_layout()
        plt.show()

        # NOTE(review): this conclusion is printed regardless of the computed
        # drop; the recorded run reports a mean 0yr → 1yr drop of 0.1144, so
        # confirm the wording still matches the numbers.
        print(
            "\n💡 Key Insight: Robust performance across different prediction horizons\n"
            "   from enrollment, demonstrating forward prediction capability."
        )

================================================================================
APPROACH 2: FLOATING PREDICTION (Enrollment-Trained)
================================================================================

28 diseases analyzed

Mean AUC drop (0yr → 1yr): 0.1144
Median AUC drop: 0.1016

Top 10 diseases by AUC drop:
           Disease  0yr_AUC  1yr_AUC  AUC_drop
    Crohns_Disease 0.896424 0.553769  0.342655
  Bipolar_Disorder 0.758267 0.439477  0.318791
Multiple_Sclerosis 0.839507 0.590238  0.249269
Ulcerative_Colitis 0.816088 0.574732  0.241356
            Asthma 0.689856 0.502862  0.186994
     Breast_Cancer 0.781816 0.596627  0.185189
        Depression 0.615522 0.448466  0.167057
 Colorectal_Cancer 0.825333 0.684249  0.141085
    Bladder_Cancer 0.824517 0.693242  0.131275
             ASCVD 0.880921 0.751321  0.129600

💡 Key Insight: Robust performance across different prediction horizons
   from enrollment, demonstrating forward prediction capability.

# Load fixed timepoint results
fixed_timepoint_file = Path('/Users/sarahurbut/aladynoulli2/pyScripts/dec_6_revision/new_notebooks/results/washout_fixed_timepoint/pooled_retrospective/washout_results_by_disease_pivot.csv')

# Wide-format AUC columns in the pivot file, one per washout length
WASHOUT_COLUMNS = ('Washout_0yr', 'Washout_1yr', 'Washout_2yr')


def washout_wide_to_long(wide_df, washout_cols=WASHOUT_COLUMNS):
    """Reshape the wide washout table into one row per disease/timepoint/washout.

    Args:
        wide_df: DataFrame with 'Disease' and 'Timepoint' columns plus one AUC
            column per entry of ``washout_cols``.
        washout_cols: Names of the wide AUC columns, each of the form
            'Washout_<N>yr'; ``<N>`` becomes the integer 'Washout_years'.

    Returns:
        DataFrame with columns Disease, Timepoint, Washout_years, AUC. Cells
        whose AUC is missing are dropped. Rows follow the input row order,
        then the order of ``washout_cols``. The four columns are present even
        when no rows survive.
    """
    washout_cols = list(washout_cols)
    years_by_col = {
        col: int(col.split('_')[1].replace('yr', '')) for col in washout_cols
    }
    # ignore_index=False keeps the source row label on every melted row so the
    # original row-major ordering can be restored with a stable sort below.
    melted = wide_df.melt(
        id_vars=['Disease', 'Timepoint'],
        value_vars=washout_cols,
        var_name='Washout_col',
        value_name='AUC',
        ignore_index=False,
    )
    melted = melted[melted['AUC'].notna()]
    tidy = melted.assign(
        Washout_years=melted['Washout_col'].map(years_by_col).astype(int)
    )
    tidy = tidy.sort_index(kind='mergesort').reset_index(drop=True)
    return tidy[['Disease', 'Timepoint', 'Washout_years', 'AUC']]


if fixed_timepoint_file.exists():
    fixed_df = pd.read_csv(fixed_timepoint_file)

    print("="*80)
    print("APPROACH 3: FIXED PREDICTION OVER 10-YEAR UPDATES")
    print("="*80)
    # The file has one row per (Disease, Timepoint), so count distinct
    # diseases rather than rows.
    print(f"\n{fixed_df['Disease'].nunique()} diseases analyzed")
    print("Timepoints evaluated: 1-9 (enrollment+1yr through enrollment+9yr)")

    # Reshape for visualization: convert wide format to long format
    # Original: Disease, Timepoint, Washout_0yr, Washout_1yr, Washout_2yr
    # Target: Disease, Timepoint, Washout_years, AUC
    df_comprehensive = washout_wide_to_long(fixed_df)

    # Select key diseases for visualization
    key_diseases = ['ASCVD', 'Parkinsons', 'Prostate_Cancer', 'Atrial_Fib', 'Breast_Cancer',
                    'Diabetes', 'CKD', 'COPD', 'Colorectal_Cancer', 'Heart_Failure']

    # Build the membership set once instead of recomputing unique() per disease
    diseases_with_results = set(df_comprehensive['Disease'])
    available_diseases = [d for d in key_diseases if d in diseases_with_results]

    if available_diseases:
        # Plot heatmaps for the first four key diseases that have results
        fig, axes = plt.subplots(2, 2, figsize=(16, 12))
        axes = axes.flatten()
        plotted_diseases = available_diseases[:4]

        for ax, disease in zip(axes, plotted_diseases):
            disease_df = df_comprehensive[df_comprehensive['Disease'] == disease]
            pivot = disease_df.pivot(index='Timepoint', columns='Washout_years', values='AUC')

            # Create heatmap
            sns.heatmap(pivot, annot=True, fmt='.3f', cmap='RdYlGn',
                        vmin=0.4, vmax=1.0, ax=ax, cbar_kws={'label': 'AUC'})

            ax.set_title(f'{disease}\nAUC by Timepoint and Washout', fontsize=12, fontweight='bold')
            ax.set_xlabel('Washout (years)', fontsize=10)
            ax.set_ylabel('Prediction Timepoint\n(enrollment + N)', fontsize=10)

        # Hide any panel left empty when fewer than four key diseases exist
        for unused_ax in axes[len(plotted_diseases):]:
            unused_ax.set_visible(False)

        plt.tight_layout()
        plt.show()

        # Summary heatmap: Average AUC across all diseases
        fig, ax = plt.subplots(1, 1, figsize=(10, 8))

        avg_pivot = df_comprehensive.groupby(['Timepoint', 'Washout_years'])['AUC'].mean().unstack()

        sns.heatmap(avg_pivot, annot=True, fmt='.3f', cmap='RdYlGn',
                    vmin=0.5, vmax=0.9, ax=ax, cbar_kws={'label': 'Mean AUC'})

        ax.set_title('Average AUC Across All Diseases\nby Prediction Timepoint and Washout Period',
                     fontsize=14, fontweight='bold')
        ax.set_xlabel('Washout (years)', fontsize=12)
        ax.set_ylabel('Prediction Timepoint (enrollment + N)', fontsize=12)

        plt.tight_layout()
        plt.show()

        print("\n" + "="*80)
        print("KEY INSIGHTS FROM COMPREHENSIVE ANALYSIS")
        print("="*80)
        print("\n1. Washout impact varies by prediction timepoint")
        print("2. Some diseases maintain performance better with washout")
        print("3. Early timepoints (enrollment+1, +2) show larger washout effects")
        print("4. Later timepoints may show different patterns")

        print("\n💡 Key Insight: Provides comprehensive view of washout effects")
        print("   across multiple evaluation timepoints over 10 years.")
        print("\nSee R2_Washout_Continued.ipynb for detailed analysis.")
    else:
        # Nothing was plotted, so say so before pointing at the follow-up notebook
        print("⚠️  None of the key diseases were found in the fixed timepoint results; no heatmaps drawn")
        print("\n💡 Key Insight: Provides comprehensive view of washout effects")
        print("   across multiple evaluation timepoints over 10 years.")
        print("\nSee R2_Washout_Continued.ipynb for detailed analysis.")
else:
    print(f"⚠️  Fixed timepoint file not found: {fixed_timepoint_file}")
    print("\nSee R2_Washout_Continued.ipynb for detailed analysis.")

================================================================================
APPROACH 3: FIXED PREDICTION OVER 10-YEAR UPDATES
================================================================================

250 diseases analyzed
Timepoints evaluated: 1-9 (enrollment+1yr through enrollment+9yr)

================================================================================
KEY INSIGHTS FROM COMPREHENSIVE ANALYSIS
================================================================================

1. Washout impact varies by prediction timepoint
2. Some diseases maintain performance better with washout
3. Early timepoints (enrollment+1, +2) show larger washout effects
4. Later timepoints may show different patterns

💡 Key Insight: Provides comprehensive view of washout effects
   across multiple evaluation timepoints over 10 years.

See R2_Washout_Continued.ipynb for detailed analysis.

R2: Comprehensive Washout Approaches Comparison

Overview

Approach 1: Time Horizon Analysis

Approach 2: Floating Prediction (Enrollment-Trained)

Approach 3: Fixed Prediction Over 10-Year Updates

Approach 4: Fixed Timepoint (Delphi Comparison)

Summary

Approach 1: Time Horizon Analysis

Approach 2: Floating Prediction (Enrollment-Trained)

Approach 3: Fixed Prediction Over 10-Year Updates

Summary and Conclusions

Key Findings Across All Approaches

Implications

References