Underfitting vs. Overfitting — Regularization Spectrum

Implementation Example

# Regularization Spectrum

from sklearn.linear_model import Lasso, Ridge, ElasticNet
from sklearn.neural_network import MLPClassifier
import torch.nn as nn

# --- L1 penalty (Lasso) -------------------------------------------------
# A larger alpha means a stronger penalty. The L1 term can push individual
# coefficients to exactly zero, which acts as implicit feature selection.
l1_model = Lasso(alpha=0.01).fit(X_train, y_train)

# --- L2 penalty (Ridge) -------------------------------------------------
# Shrinks coefficients toward zero; they typically stay non-zero.
l2_model = Ridge(alpha=1.0).fit(X_train, y_train)

# --- Elastic Net: blend of L1 and L2 ------------------------------------
# l1_ratio=0.5 weights the L1 and L2 penalty terms evenly.
elastic_model = ElasticNet(alpha=0.1, l1_ratio=0.5).fit(X_train, y_train)

# Dropout for Neural Networks
class DropoutNet(nn.Module):
    """Two-layer fully connected network with dropout on the hidden layer.

    Layer order: Linear -> ReLU -> Dropout -> Linear. The output is the raw
    result of the final linear layer (no softmax is applied).

    Args:
        in_features: Size of each input sample (default 784).
        hidden_features: Width of the hidden layer (default 256).
        num_classes: Size of each output sample (default 10).
        p: Probability of zeroing a hidden activation while the module is in
            training mode (default 0.5).
    """

    def __init__(
        self,
        in_features: int = 784,
        hidden_features: int = 256,
        num_classes: int = 10,
        p: float = 0.5,
    ) -> None:
        super().__init__()
        self.fc1 = nn.Linear(in_features, hidden_features)
        self.dropout = nn.Dropout(p)
        self.fc2 = nn.Linear(hidden_features, num_classes)

    def forward(self, x):
        """Map a batch of inputs to a batch of ``num_classes`` outputs."""
        x = self.fc1(x)
        # Use nn.functional rather than torch.relu: only `torch.nn` is
        # imported as `nn`, so the bare name `torch` is not bound here.
        x = nn.functional.relu(x)
        # nn.Dropout is only active in training mode; after .eval() it is
        # the identity.
        x = self.dropout(x)
        return self.fc2(x)

# Batch Normalization
class BatchNormNet(nn.Module):
    """Two-layer fully connected network with batch norm on the hidden layer.

    Layer order: Linear -> BatchNorm1d -> ReLU -> Linear. The output is the
    raw result of the final linear layer (no softmax is applied).

    Note that ``nn.BatchNorm1d`` in training mode needs more than one sample
    per batch to compute batch statistics.

    Args:
        in_features: Size of each input sample (default 784).
        hidden_features: Width of the hidden layer (default 256).
        num_classes: Size of each output sample (default 10).
    """

    def __init__(
        self,
        in_features: int = 784,
        hidden_features: int = 256,
        num_classes: int = 10,
    ) -> None:
        super().__init__()
        self.fc1 = nn.Linear(in_features, hidden_features)
        self.bn = nn.BatchNorm1d(hidden_features)
        self.fc2 = nn.Linear(hidden_features, num_classes)

    def forward(self, x):
        """Map a batch of inputs to a batch of ``num_classes`` outputs."""
        x = self.fc1(x)
        # Normalization is applied before the non-linearity.
        x = self.bn(x)
        # Use nn.functional rather than torch.relu: only `torch.nn` is
        # imported as `nn`, so the bare name `torch` is not bound here.
        x = nn.functional.relu(x)
        return self.fc2(x)

Underfitting vs. Overfitting — Regularization Spectrum

Intent & Description

🎯 Intent

📋 Context

💡 Solution

Real-world Use Case

📌 TL;DR

Advantages

Disadvantages