Deep Learning – Regression (TensorFlow / Keras)¶

This notebook is part of the ML-Methods project.

It introduces Deep Learning for supervised regression using TensorFlow / Keras.

As with all other notebooks in this project, the initial sections focus on data preparation and are intentionally repeated.

This ensures:

  • consistency across models
  • fair comparison of results
  • a unified learning pipeline

Notebook Roadmap (standard ML-Methods)¶

  1. Project setup and common pipeline
  2. Dataset loading
  3. Train-test split
  4. Feature scaling (why we do it)
  5. What is this model? (Intuition)
  6. Model training
  7. Model behavior and key parameters
  8. Predictions
  9. Model evaluation
  10. When to use it and when not to
  11. Model persistence
  12. Mathematical formulation (deep dive)
  13. Final summary – Code only

How this notebook should be read¶

This notebook is designed to be read top to bottom.

Before every code cell, you will find a short explanation describing:

  • what we are about to do
  • why this step is necessary
  • how it fits into the overall process

Compared to PyTorch:

  • Keras reduces boilerplate code
  • training is handled via .fit()
  • gradients and updates are abstracted away

What is Deep Learning Regression (in this context)?¶

Deep Learning regression refers to using multi-layer neural networks to predict a continuous numerical target.

The model learns a mapping:

input features → continuous output

This allows the network to capture:

  • non-linear relationships
  • feature interactions
  • complex patterns in tabular data

What you should expect from the results¶

With Deep Learning (TensorFlow / Keras regression), you should expect:

  • non-linear regression capability
  • strong performance on complex patterns
  • high sensitivity to feature scaling
  • training behavior similar to PyTorch

However:

  • interpretability is low
  • results can depend strongly on hyperparameter choices
  • overfitting is possible on limited data


1. Project setup and common pipeline¶

In this section we set up the common pipeline used across regression models in this project.

Although this notebook uses TensorFlow / Keras, the surrounding workflow remains consistent with all other regression notebooks.

In [6]:
# ====================================
# Common imports used across regression models
# ====================================

import numpy as np
import pandas as pd

from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

from sklearn.metrics import (
    mean_squared_error,
    mean_absolute_error,
    r2_score
)

from pathlib import Path
import joblib
import matplotlib.pyplot as plt

# ====================================
# TensorFlow / Keras imports
# ====================================

import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers

What changes with TensorFlow / Keras¶

Compared to scikit-learn:

  • model definition is more flexible
  • training is explicit via .fit()

Compared to PyTorch:

  • training loops are hidden
  • gradients and updates are handled automatically

In the next section, we will load the regression dataset.


2. Dataset loading¶

In this section we load the dataset used for the deep learning regression task.

We use the same regression dataset adopted in the other regression notebooks to ensure fair comparison.

In [7]:
# ====================================
# Dataset loading
# ====================================

data = fetch_california_housing(as_frame=True)

X = data.data
y = data.target

Inputs and target¶

  • X contains the input features
  • y contains the continuous target variable

This is a supervised regression problem.
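
A quick sanity check of shapes and value ranges is cheap and catches loading mistakes early. A minimal sketch:

In [ ]:
# ====================================
# (Sketch) Quick dataset sanity check
# ====================================

print(X.shape)             # (20640, 8): 20640 samples, 8 numerical features
print(X.columns.tolist())  # feature names
print(y.describe())        # target: median house value (in units of $100k)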

In the next section, we split the dataset into training and test sets.


3. Train-test split¶

In this section we split the dataset into training and test sets.

This allows us to evaluate generalization on unseen data.

In [8]:
# ====================================
# Train-test split
# ====================================

X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42
)

Why this matters¶

The model must be evaluated on unseen data to obtain realistic performance.

In the next section, we apply feature scaling, which is mandatory for neural networks.


4. Feature scaling (why we do it)¶

In this section we apply feature scaling to the input features.

For deep learning regression models, feature scaling is mandatory.

In [9]:
# ====================================
# Feature scaling
# ====================================

scaler = StandardScaler()

X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)

Why scaling is essential¶

Neural networks are trained using gradients.

Standardization:

  • stabilizes optimization
  • improves convergence speed
  • prevents unstable training behavior
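
As a quick check, after standardization every training feature should have mean close to 0 and standard deviation close to 1 (the test set will be close but not exact, since it is transformed with the training statistics):

In [ ]:
# ====================================
# (Sketch) Verify the effect of standardization
# ====================================

print(X_train_scaled.mean(axis=0).round(3))  # ~0 for every feature
print(X_train_scaled.std(axis=0).round(3))   # ~1 for every feature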

In the next section, we explain what the model is doing conceptually.


5. What is this model? (Deep Learning Regression – TensorFlow / Keras)¶

Before training the model, it is crucial to understand what a neural network is doing when it is used for regression.

In regression, the objective is to predict a continuous numerical value, not a category or class.

What problem are we solving?¶

Each data point is represented by:

  • multiple numerical input features
  • one continuous target value

The goal of the model is to learn a function:

input features → numerical output

This function should approximate the true underlying relationship between inputs and target.

How a neural network represents the problem¶

A neural network treats each input sample as:

  • a point in a high-dimensional space
  • where each feature is one dimension

The network learns how to map this point in input space to a single value on the output axis.

What each layer does conceptually¶

Each layer performs two operations:

  1. Linear transformation
    A weighted combination of inputs
    (what to look at and how strongly)

  2. Non-linear transformation
    An activation function introduces flexibility
    (how to bend the function)

By stacking layers:

  • simple patterns are combined
  • complex relationships emerge
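
To make these two operations concrete, here is a minimal NumPy sketch of one Dense layer with ReLU. The shapes are small and the weights are random placeholders, not learned values:

In [ ]:
# ====================================
# (Sketch) One Dense layer, by hand
# ====================================

import numpy as np

rng = np.random.default_rng(0)

x = rng.normal(size=4)       # one sample with 4 input features
W = rng.normal(size=(3, 4))  # 3 neurons, each with 4 weights
b = np.zeros(3)              # one bias per neuron

z = W @ x + b                # 1. linear transformation (what to look at)
h = np.maximum(0.0, z)       # 2. ReLU activation (how to bend the function)

print(z)
print(h)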

Why non-linearity matters in regression¶

Without non-linearity:

  • the model would reduce to linear regression
  • no additional expressive power would be gained

ReLU activation allows the model to:

  • learn piecewise linear functions
  • adapt to complex data structures
  • approximate highly non-linear mappings

Why the output layer is linear¶

In regression:

  • the output is a real number
  • values are not bounded
  • there is no probability interpretation

A linear output layer ensures:

  • unrestricted numerical predictions
  • compatibility with error-based loss functions

How learning happens (high-level view)¶

Training consists of repeating the following steps:

  1. The model makes a prediction
  2. The prediction is compared to the true value
  3. An error is computed (loss)
  4. Model parameters are adjusted
  5. The process repeats

Over time, the network adjusts its internal parameters to reduce prediction error.

What TensorFlow / Keras abstracts for us¶

Keras automatically handles:

  • forward pass
  • loss computation
  • gradient calculation
  • parameter updates

This allows us to focus on:

  • model design
  • data preparation
  • result interpretation

rather than on low-level mechanics.
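
For intuition, the sketch below shows roughly what a single training step looks like when written by hand with tf.GradientTape; calling .fit() runs an equivalent loop for us. The tiny network here is a throwaway defined only for this illustration, not the model trained later in this notebook:

In [ ]:
# ====================================
# (Sketch) One hand-written gradient step
# ====================================

tiny_model = keras.Sequential([
    layers.Input(shape=(X_train_scaled.shape[1],)),
    layers.Dense(16, activation="relu"),
    layers.Dense(1),
])
optimizer = keras.optimizers.Adam(learning_rate=0.001)
loss_fn = keras.losses.MeanSquaredError()

x_batch = X_train_scaled[:32]
y_batch = y_train.to_numpy()[:32].astype("float32")

with tf.GradientTape() as tape:
    y_hat = tiny_model(x_batch, training=True)          # 1-2. forward pass
    loss = loss_fn(y_batch, tf.squeeze(y_hat, axis=1))  # 3. compute the loss

grads = tape.gradient(loss, tiny_model.trainable_variables)            # gradients
optimizer.apply_gradients(zip(grads, tiny_model.trainable_variables))  # 4. update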

Key takeaway¶

A deep learning regression model:

  • learns a non-linear mapping
  • approximates a continuous function
  • improves through iterative error reduction

Understanding this conceptual process is more important than memorizing code.

In the next section, we will see how this concept is translated into an actual model.


6. Model training (TensorFlow / Keras Regression)¶

In this section we define and train a neural network regressor using Keras.

The model outputs a single value, so the output layer has 1 neuron and uses a linear activation.

In [10]:
# ====================================
# Model definition (Keras)
# ====================================

model = keras.Sequential([
    layers.Input(shape=(X_train_scaled.shape[1],)),
    layers.Dense(64, activation="relu"),
    layers.Dense(32, activation="relu"),
    layers.Dense(1)  # regression output
])
In [11]:
# ====================================
# Model compilation
# ====================================

model.compile(
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    loss="mse",
    metrics=["mae"]
)
In [12]:
# ====================================
# Model training
# ====================================

history = model.fit(
    X_train_scaled,
    y_train,
    epochs=100,
    batch_size=32,
    verbose=0
)
In [13]:
# ====================================
# Training history visualization
# ====================================

history_dict = history.history
epochs = range(1, len(history_dict["loss"]) + 1)

plt.figure(figsize=(12, 4))

plt.subplot(1, 2, 1)
plt.plot(epochs, history_dict["loss"], marker="o")
plt.title("Training Loss (MSE)")
plt.xlabel("Epoch")
plt.ylabel("Loss")
plt.grid(True)

plt.subplot(1, 2, 2)
plt.plot(epochs, history_dict["mae"], marker="o")
plt.title("Training MAE")
plt.xlabel("Epoch")
plt.ylabel("MAE")
plt.grid(True)

plt.tight_layout()
plt.show()
[Figure: training loss (MSE) and training MAE per epoch]

What we just did¶

  • defined a regression neural network
  • compiled it with MSE loss and Adam optimizer
  • trained it for 100 epochs without printing output
  • visualized the learning curves

In the next section, we analyze model behavior and key parameters.


7. Model behavior and key parameters¶

In this section we analyze how the TensorFlow / Keras regression model behaves and which parameters most strongly influence learning.

Although Keras hides the training loop, the underlying behavior follows standard deep learning principles.

Model capacity and architecture¶

Model capacity refers to how complex a function the network can represent.

Capacity is controlled by:

  • number of layers
  • number of neurons per layer
  • choice of activation functions

In this notebook:

  • two hidden layers are used
  • with 64 and 32 neurons respectively

This provides a balance between:

  • expressive power
  • generalization ability

Effect of increasing model capacity¶

Increasing capacity allows the model to:

  • fit more complex patterns
  • capture subtle feature interactions

However:

  • excessive capacity increases overfitting risk
  • the model may learn noise instead of structure

Capacity must always be evaluated relative to dataset size.

Role of activation functions¶

ReLU activation:

  • introduces non-linearity
  • avoids vanishing gradient issues
  • enables piecewise linear approximations

Without activation functions:

  • additional layers would be useless
  • the network would collapse to a linear model

Loss function behavior¶

The model is trained using Mean Squared Error (MSE).

MSE:

  • penalizes large errors more strongly
  • encourages overall accuracy
  • is differentiable and stable

This makes it suitable for continuous-value prediction.

Optimization dynamics (Adam)¶

The Adam optimizer:

  • adapts learning rates automatically
  • stabilizes training
  • converges faster than plain gradient descent

Adam helps the model:

  • escape poor local solutions
  • handle noisy gradients
  • train reliably without heavy tuning

Training duration (epochs)¶

Each epoch represents:

  • one full pass over the training data

More epochs:

  • reduce training error
  • increase risk of overfitting

Too few epochs:

  • lead to underfitting
  • prevent full learning

Monitoring learning curves is essential to understand this trade-off.
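
One common way to manage this trade-off is to hold out part of the training data for validation and stop when validation loss stops improving. A sketch using Keras's EarlyStopping callback (not used in this notebook's run, where a fixed 100 epochs is kept for comparability across models):

In [ ]:
# ====================================
# (Sketch) Early stopping on a validation split
# ====================================

early_stop = keras.callbacks.EarlyStopping(
    monitor="val_loss",         # watch generalization, not training loss
    patience=10,                # tolerate 10 epochs without improvement
    restore_best_weights=True,  # roll back to the best weights seen
)

history_es = model.fit(
    X_train_scaled,
    y_train,
    validation_split=0.2,       # hold out 20% of training data for validation
    epochs=200,                 # upper bound; early stopping usually halts sooner
    batch_size=32,
    callbacks=[early_stop],
    verbose=0,
)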

Sensitivity to feature scaling¶

Neural networks are highly sensitive to the scale of input features.

Without scaling:

  • gradients become unstable
  • learning slows or fails
  • training may diverge

Standardization is therefore an essential component of the model, not an optional preprocessing step.

Generalization behavior¶

Good generalization occurs when:

  • training error decreases
  • test error remains low

Poor generalization (overfitting) occurs when:

  • training error is very small
  • test error stops improving or increases

This behavior must be checked on unseen data.

Key takeaway¶

The behavior of a deep learning regression model is governed by:

  • architecture
  • optimization strategy
  • training duration
  • data preprocessing

Understanding these elements is essential to diagnose model performance and make informed design decisions.


8. Predictions¶

In this section we generate predictions using the trained TensorFlow / Keras regression model.

For regression:

  • predictions are continuous numerical values
  • each input sample produces one output number
  • there are no class labels or probabilities

The goal is to obtain:

  • y_pred: predicted target values for the test set

In the evaluation section, these predictions will be compared to:

  • y_test: the true target values
In [14]:
# ====================================
# Predictions
# ====================================

y_pred = model.predict(X_test_scaled).flatten()

What happens inside model.predict()¶

When calling model.predict():

  • the model performs a forward pass on X_test_scaled
  • each Dense layer applies its learned transformation
  • the final layer outputs a single real number per sample

Important:

  • no training happens here
  • weights are not updated
  • the model is only applying what it has learned

What we have after this step¶

  • y_test: true continuous values (ground truth)
  • y_pred: predicted continuous values

We now need to quantify:

  • how close predictions are to true values
  • how large the typical error is
  • whether the model generalizes well

In the next section, we evaluate performance using regression metrics.


9. Model evaluation¶

In this section we evaluate the regression model using standard regression metrics.

Regression evaluation focuses on:

  • prediction error magnitude
  • sensitivity to large errors
  • overall fit quality

We compute:

  • MSE (Mean Squared Error)
  • RMSE (Root Mean Squared Error)
  • MAE (Mean Absolute Error)
  • R² score (coefficient of determination)
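
For reference, the same four metrics in formula form (with $$y_i$$ the true values, $$\hat{y}_i$$ the predictions, and $$\bar{y}$$ the mean of the true values):

$$ MSE = \frac{1}{n}\sum_{i=1}^{n}(y_i - \hat{y}_i)^2 \qquad RMSE = \sqrt{MSE} $$

$$ MAE = \frac{1}{n}\sum_{i=1}^{n}\lvert y_i - \hat{y}_i \rvert \qquad R^2 = 1 - \frac{\sum_{i=1}^{n}(y_i - \hat{y}_i)^2}{\sum_{i=1}^{n}(y_i - \bar{y})^2} $$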
In [15]:
# ====================================
# Regression evaluation metrics
# ====================================

mse = mean_squared_error(y_test, y_pred)
rmse = np.sqrt(mse)
mae = mean_absolute_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

mse, rmse, mae, r2
Out[15]:
(0.26502627885126145,
 np.float64(0.5148070306933089),
 0.3496456228591051,
 0.7977530044039882)

Mean Squared Error (MSE)¶

MSE measures the average squared difference:

  • squaring makes large errors count much more
  • useful when large mistakes are particularly costly
  • harder to interpret directly because it is in squared units

Root Mean Squared Error (RMSE)¶

RMSE is the square root of MSE:

  • brings the error back to the same unit as the target
  • directly answers: "on average, how wrong are we?"
  • penalizes large errors more than MAE

This is often the most interpretable metric in real-world regression problems.

Mean Absolute Error (MAE)¶

MAE measures average absolute error:

  • easier to interpret than MSE
  • less sensitive to outliers than RMSE
  • reflects typical deviation without squaring

MAE is often preferred when:

  • you want a robust average error measure
  • outliers should not dominate evaluation

R² score (coefficient of determination)¶

R² measures how much of the target variance is explained by the model:

  • R² = 1 → perfect prediction
  • R² = 0 → similar to predicting the mean for everything
  • R² < 0 → worse than a baseline predictor

R² describes fit quality, while RMSE/MAE describe error magnitude.

How to read these results together¶

No single metric is sufficient.

A good regression model typically shows:

  • low RMSE
  • low MAE
  • high R²

However:

  • high R² does not guarantee low absolute error
  • low error on training does not guarantee generalization

Metrics must always be computed on unseen data, as done in this notebook.

Optional but useful: quick visual check¶

Even with good numerical metrics, it is often helpful to visualize:

  • predicted vs true values
  • residuals (errors)

This can reveal:

  • systematic bias
  • underestimation / overestimation patterns
  • outlier behavior

(We keep plots optional to maintain consistency, but they are valuable in real-world workflows.)
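
A minimal sketch of such a check, reusing y_test and y_pred from above:

In [ ]:
# ====================================
# (Sketch) Predicted vs true, and residuals
# ====================================

plt.figure(figsize=(12, 4))

plt.subplot(1, 2, 1)
plt.scatter(y_test, y_pred, s=5, alpha=0.3)
lims = [y_test.min(), y_test.max()]
plt.plot(lims, lims, "r--")  # perfect-prediction line
plt.xlabel("True value")
plt.ylabel("Predicted value")
plt.title("Predicted vs True")

plt.subplot(1, 2, 2)
residuals = y_test - y_pred
plt.hist(residuals, bins=50)
plt.xlabel("Residual (true - predicted)")
plt.ylabel("Count")
plt.title("Residual distribution")

plt.tight_layout()
plt.show()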


10. When to use it and when not to¶

Deep Learning regression with TensorFlow / Keras can be very effective, but it is not always the best tool.

Model choice should consider:

  • data complexity
  • dataset size
  • interpretability requirements
  • training resources and maintainability

When to use TensorFlow / Keras regression¶

TensorFlow / Keras regression is a good choice when:

  • relationships are strongly non-linear
  • feature interactions are complex
  • classical models (linear regression, ridge, lasso) underperform
  • you need a flexible model that can grow with data
  • deployment is a goal (TensorFlow ecosystem)

It is commonly used for:

  • scalable production pipelines
  • rapid experimentation and prototyping
  • deep learning systems with future expansion

When NOT to use it¶

It may not be ideal when:

  • the dataset is small or noisy
  • the problem is close to linear
  • interpretability is critical
  • training time or resources are limited
  • a simpler model achieves similar RMSE/MAE

In these cases, classical regression models are often preferable.

Warning signs in practice¶

You should be cautious if:

  • training loss keeps decreasing but test metrics do not improve
  • the model becomes sensitive to random initialization
  • results vary too much across runs
  • performance gains are marginal compared to simpler models

These are typical indicators that deep learning may be unnecessary or that regularization is needed.

Key takeaway¶

TensorFlow / Keras regression is powerful when the problem justifies model complexity.

It should be chosen when:

  • you need non-linear function approximation
  • you have enough data
  • the performance gain matters

Otherwise, simpler models may provide the same value with lower cost and higher interpretability.


11. Model persistence¶

In this section we save:

  • the trained TensorFlow / Keras regression model
  • the scaler used for preprocessing

Saving the full pipeline ensures:

  • reproducibility
  • correct inference on future data
  • separation of training and deployment
In [ ]:
# ====================================
# Model persistence
# ====================================

model_dir = Path("models/supervised_learning/regression/deep_learning_tensorflow")
model_dir.mkdir(parents=True, exist_ok=True)

# Save full Keras model (architecture + weights + config)
# Note: recent Keras versions require the native ".keras" extension here
model.save(model_dir / "tensorflow_keras_regression_model.keras")

# Save scaler used during training
joblib.dump(scaler, model_dir / "scaler.joblib")

What we saved and why¶

We saved the full Keras model so that:

  • we do not need to redefine the architecture later
  • weights and configuration are restored automatically

We saved the scaler because:

  • neural networks depend heavily on feature scaling
  • using different scaling would change the meaning of inputs
  • consistent preprocessing is essential for reliable predictions

Reuse workflow (conceptual)¶

To reuse the model later:

  1. load the scaler
  2. scale new input data
  3. load the Keras model
  4. predict continuous values

This ensures inference is consistent with training.
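
A minimal sketch of this workflow (the filename matches the persistence cell above; the first rows of X_test stand in for whatever raw, unscaled data arrives at inference time):

In [ ]:
# ====================================
# (Sketch) Reload and predict on new data
# ====================================

loaded_scaler = joblib.load(model_dir / "scaler.joblib")
loaded_model = keras.models.load_model(
    model_dir / "tensorflow_keras_regression_model.keras"
)

new_data = X_test.iloc[:5]                           # stand-in for fresh input
new_data_scaled = loaded_scaler.transform(new_data)  # same scaling as training
predictions = loaded_model.predict(new_data_scaled).flatten()
print(predictions)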


12. Mathematical formulation (deep dive)¶

This section describes the mathematical structure behind deep learning regression.

The focus is on:

  • how the network computes predictions
  • what is minimized during training
  • why optimization works iteratively

Supervised regression dataset¶

We train on pairs:

$$ \{(x_i, y_i)\}_{i=1}^{n} $$

where:

  • $$x_i \in \mathbb{R}^d$$ is a feature vector
  • $$y_i \in \mathbb{R}$$ is a continuous target

Neural network as a function¶

The model learns a function:

$$ \hat{y} = f(x; \theta) $$

where:

  • $$\theta$$ includes all weights and biases
  • $$\hat{y}$$ is the predicted value

Dense layer computation¶

A Dense layer computes:

$$ z = W x + b $$

Then applies a non-linearity:

$$ h = \phi(z) $$

In this notebook, the activation is ReLU:

$$ \phi(z) = \max(0, z) $$

Output layer for regression¶

The last layer is linear:

$$ \hat{y} = W_{\text{out}} h + b_{\text{out}} $$

This is necessary because regression outputs must remain unrestricted real numbers.

Loss function (MSE)¶

Training minimizes Mean Squared Error:

$$ MSE = \frac{1}{n}\sum_{i=1}^{n}(y_i - \hat{y}_i)^2 $$

The model learns by adjusting parameters to reduce this quantity over iterations.

Gradient-based optimization¶

Parameters are updated iteratively:

$$ \theta \leftarrow \theta - \eta \nabla_{\theta} MSE $$

where:

  • $$\eta$$ is the learning rate
  • gradients indicate how parameters should change

Keras performs this automatically when calling .fit().
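
To see this update rule in action, here is a tiny NumPy sketch of gradient descent on MSE for a one-parameter linear model $$\hat{y} = \theta x$$. It is purely illustrative; the network's case is the same idea with many parameters and backpropagation computing the gradients:

In [ ]:
# ====================================
# (Sketch) Gradient descent on MSE, one parameter
# ====================================

import numpy as np

x = np.array([1.0, 2.0, 3.0, 4.0])
y = 3.0 * x              # toy data from y = 3x, so the optimum is theta = 3

theta, eta = 0.0, 0.05   # initial parameter and learning rate
for _ in range(100):
    y_hat = theta * x
    grad = (2 / len(x)) * np.sum((y_hat - y) * x)  # d(MSE)/d(theta)
    theta -= eta * grad  # theta <- theta - eta * gradient

print(theta)             # ~3.0 after convergence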

Final takeaway¶

Deep learning regression is:

  • non-linear function approximation
  • trained by minimizing prediction error (MSE)
  • optimized iteratively using gradients

The mathematical components are simple, but their composition yields powerful models.


13. Final summary – Code only¶

The following cell contains the complete TensorFlow / Keras regression pipeline.

No explanations are provided here.

In [ ]:
# ====================================
# Imports
# ====================================

import numpy as np
import pandas as pd

from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score

from pathlib import Path
import joblib
import matplotlib.pyplot as plt

import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers


# ====================================
# Dataset loading
# ====================================

data = fetch_california_housing(as_frame=True)
X = data.data
y = data.target


# ====================================
# Train-test split
# ====================================

X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)


# ====================================
# Feature scaling
# ====================================

scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)


# ====================================
# Model definition
# ====================================

model = keras.Sequential([
    layers.Input(shape=(X_train_scaled.shape[1],)),
    layers.Dense(64, activation="relu"),
    layers.Dense(32, activation="relu"),
    layers.Dense(1)
])


# ====================================
# Model compilation
# ====================================

model.compile(
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    loss="mse",
    metrics=["mae"]
)


# ====================================
# Model training
# ====================================

history = model.fit(
    X_train_scaled,
    y_train,
    epochs=100,
    batch_size=32,
    verbose=0
)


# ====================================
# Training history visualization
# ====================================

history_dict = history.history
epochs = range(1, len(history_dict["loss"]) + 1)

plt.figure(figsize=(12, 4))

plt.subplot(1, 2, 1)
plt.plot(epochs, history_dict["loss"], marker="o")
plt.title("Training Loss (MSE)")
plt.xlabel("Epoch")
plt.ylabel("Loss")
plt.grid(True)

plt.subplot(1, 2, 2)
plt.plot(epochs, history_dict["mae"], marker="o")
plt.title("Training MAE")
plt.xlabel("Epoch")
plt.ylabel("MAE")
plt.grid(True)

plt.tight_layout()
plt.show()


# ====================================
# Predictions
# ====================================

y_pred = model.predict(X_test_scaled).flatten()


# ====================================
# Evaluation
# ====================================

mse = mean_squared_error(y_test, y_pred)
rmse = np.sqrt(mse)
mae = mean_absolute_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

print(mse, rmse, mae, r2)


# ====================================
# Model persistence
# ====================================

model_dir = Path("models/supervised_learning/regression/deep_learning_tensorflow")
model_dir.mkdir(parents=True, exist_ok=True)

model.save(model_dir / "tensorflow_keras_regression_model.keras")
joblib.dump(scaler, model_dir / "scaler.joblib")