Function bodies 261 total

HealthWorkoutCorrelationAnalyzer._generate_visualizations method · python · L516-L533 (18 LOC)

src/analysis/explore_health_workout_correlations.py

    def _generate_visualizations(self, summary_df: pd.DataFrame) -> None:
        """Generate visualization plots."""
        print("\nGenerating visualizations...")

        # Create visualizations directory
        viz_dir = self.output_dir / "visualizations"
        viz_dir.mkdir(exist_ok=True)

        # 1. Correlation strength by health metric category
        self._plot_correlation_strength(summary_df, viz_dir)

        # 2. Lag distribution
        self._plot_lag_distribution(summary_df, viz_dir)

        # 3. Top correlations heatmap
        self._plot_top_correlations_heatmap(summary_df, viz_dir)

        print(f"Visualizations saved to: {viz_dir}")

HealthWorkoutCorrelationAnalyzer._plot_correlation_strength method · python · L535-L573 (39 LOC)

src/analysis/explore_health_workout_correlations.py

    def _plot_correlation_strength(self, summary_df: pd.DataFrame, viz_dir: Path) -> None:
        """Plot correlation strength by health metric category."""
        # Categorize health metrics
        def categorize_metric(metric: str) -> str:
            """Map a health metric name to a coarse display category.

            Matching is a case-insensitive substring search. Rule groups are
            tried in the order listed and the first group with a hit wins;
            names matching nothing fall into 'Other'.
            """
            name = metric.lower()
            # Order matters: e.g. a name containing both 'sleep' and 'stress'
            # is classified as 'Sleep'.
            keyword_groups = (
                ('Sleep', ('sleep', 'rem')),
                ('Stress', ('stress',)),
                ('Heart', ('heart', 'hr')),
                ('Activity', ('step', 'calori', 'distance')),
                ('Respiration', ('respir',)),
                ('Body Battery', ('battery',)),
            )
            for label, keywords in keyword_groups:
                for keyword in keywords:
                    if keyword in name:
                        return label
            return 'Other'

        summary_df['category'] = summary_df['health_metric'].apply(categorize_metr

HealthWorkoutCorrelationAnalyzer._plot_lag_distribution method · python · L575-L589 (15 LOC)

src/analysis/explore_health_workout_correlations.py

    def _plot_lag_distribution(self, summary_df: pd.DataFrame, viz_dir: Path) -> None:
        """Plot a histogram of the strongest-lag values and save it as a PNG.

        Args:
            summary_df: Table with a ``strongest_lag`` column.
            viz_dir: Directory that receives ``lag_distribution.png``.
        """
        fig = plt.figure(figsize=(10, 6))
        try:
            # Bin edges 0..max_lag+1 give one bin per lag value. align='left'
            # centres each bar on its left edge so the bar for lag k sits on
            # tick k instead of spanning k..k+1.
            # NOTE(review): assumes lags are whole days in 0..max_lag - confirm.
            plt.hist(summary_df['strongest_lag'], bins=range(self.max_lag + 2),
                     edgecolor='black', alpha=0.7, align='left')
            plt.title('Distribution of Optimal Lag Days')
            plt.xlabel('Lag (days)')
            plt.ylabel('Count')
            plt.xticks(range(self.max_lag + 1))

            plot_path = viz_dir / "lag_distribution.png"
            plt.savefig(plot_path, dpi=150)
        finally:
            # Always release the figure, even if plotting or saving failed;
            # pyplot keeps figures alive until they are explicitly closed.
            plt.close(fig)

HealthWorkoutCorrelationAnalyzer._plot_top_correlations_heatmap method · python · L591-L616 (26 LOC)

src/analysis/explore_health_workout_correlations.py

    def _plot_top_correlations_heatmap(self, summary_df: pd.DataFrame, viz_dir: Path) -> None:
        """Create heatmap of top correlations."""
        # Get top 20 correlations by absolute value
        top_n = min(20, len(summary_df))
        top_df = summary_df.nlargest(top_n, 'abs_correlation').copy()

        # Create pivot table for heatmap
        pivot_data = top_df.pivot_table(
            values='correlation',
            index='health_metric',
            columns='workout_var',
            aggfunc='first'
        )

        if pivot_data.empty:
            return

        plt.figure(figsize=(12, 10))
        sns.heatmap(pivot_data, annot=True, fmt='.2f', cmap='RdBu_r',
                   center=0, square=True, cbar_kws={'label': 'Correlation (r)'})
        plt.title(f'Top {top_n} Health-Workout Correlations')
        plt.tight_layout()

        plot_path = viz_dir / "top_correlations_heatmap.png"
        plt.savefig(plot_path, dpi=150)
        plt.close()

main function · python · L619-L690 (72 LOC)

src/analysis/explore_health_workout_correlations.py

def main():
    """Main entry point."""
    parser = argparse.ArgumentParser(
        description="Explore correlations between workouts and health metrics"
    )

    # Required arguments
    parser.add_argument(
        "--workout-vars",
        type=str,
        required=True,
        help="Comma-separated list of workout variables to analyze"
    )

    # Analysis parameters
    parser.add_argument(
        "--max-lag",
        type=int,
        default=7,
        help="Maximum lag to compute correlations for (default: 7)"
    )
    parser.add_argument(
        "--max-metrics",
        type=int,
        default=20,
        help="Maximum number of health metrics to analyze (default: 20)"
    )
    parser.add_argument(
        "--min-observations",
        type=int,
        default=50,
        help="Minimum number of observations required (default: 50)"
    )

    # Output
    parser.add_argument(
        "--output-dir",
        type=str,
        default="output/health_correlations",

load_correlation_data function · python · L29-L36 (8 LOC)