#   Used for numerical operations and data manipulation.
import numpy as np 
import pandas as pd

#  Provides a real-world regression dataset for demonstration purposes.
from sklearn.datasets import fetch_california_housing

#  Ensures a clean separation between training and test data.
from sklearn.model_selection import train_test_split

#  Applies feature scaling to ensure numerical stability and pipeline consistency.
from sklearn.preprocessing import StandardScaler

#  Used later to assess model performance.
from sklearn.metrics import mean_squared_error, r2_score , mean_absolute_error

# Used for robust, platform-independent file paths.
from pathlib import Path

#  Used to save trained models and preprocessing objects.
import joblib

# Load the California housing dataset in pandas form (as_frame=True) and
# pull out the feature table and the target.
data = fetch_california_housing(as_frame=True)
X, y = data.data, data.target

# Hold out 20% of the rows for testing; the fixed seed keeps the split
# reproducible from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)

# Learn the scaling statistics from the training rows only, then apply the
# same fitted transform to both splits so the test rows never influence it.
scaler = StandardScaler()
scaler.fit(X_train)

X_train_scaled = scaler.transform(X_train)
X_test_scaled = scaler.transform(X_test)

from sklearn.linear_model import LinearRegression

# Create the estimator with its default settings.
model = LinearRegression()

# Fit it on the scaled training features and the training targets.
model.fit(X=X_train_scaled, y=y_train)

# Output: LinearRegression()

# Read the learned parameters off the fitted model. The weights are labelled
# with the feature column names so each one can be matched to its input.
intercept = model.intercept_
coefficients = pd.Series(data=model.coef_, index=X.columns)

# Bare expression: shows the pair when it is the last line of a notebook cell.
coefficients, intercept

# Output:
# (MedInc        0.854383
#  HouseAge      0.122546
#  AveRooms     -0.294410
#  AveBedrms     0.339259
#  Population   -0.002308
#  AveOccup     -0.040829
#  Latitude     -0.896929
#  Longitude    -0.869842
#  dtype: float64,
#  np.float64(2.071946937378881))

import matplotlib.pyplot as plt

# Select the feature to visualize. The name is looked up from the index so the
# two cannot drift apart when a different column is chosen.
feature_index = 0
feature_name = X.columns[feature_index]

# Number of evenly spaced points used to draw the prediction line.
n_points = 100

# Create artificial input data: every column stays at 0 while the selected
# column sweeps the range observed in the scaled training data.
feature_values = X_train_scaled[:, feature_index]
X_vis = np.zeros((n_points, X_train_scaled.shape[1]))
X_vis[:, feature_index] = np.linspace(
    feature_values.min(),
    feature_values.max(),
    n_points,
)

# Predictions along the sweep
y_vis_pred = model.predict(X_vis)

# Plot the training points and the model's response to the selected feature.
# NOTE: the x-axis carries the scaled feature values, not the raw ones.
plt.figure(figsize=(8, 5))

plt.scatter(
    feature_values,
    y_train,
    alpha=0.25,
    label="Training data"
)

plt.plot(
    X_vis[:, feature_index],
    y_vis_pred,
    linewidth=3,
    label="Linear Regression prediction"
)

plt.xlabel(feature_name)
plt.ylabel("Target")
plt.title("Effect of a single feature on predictions")
plt.legend()
plt.grid(True)
plt.show()

# Generate predictions on the test set
y_pred = model.predict(X=X_test_scaled)

# Compute evaluation metrics; each one compares the held-out targets with
# the predictions made for the same rows.
mse = mean_squared_error(y_true=y_test, y_pred=y_pred)
rmse = np.sqrt(mse)
mae = mean_absolute_error(y_true=y_test, y_pred=y_pred)
r2 = r2_score(y_true=y_test, y_pred=y_pred)

# Bare expression: shows the four values when it ends a notebook cell.
mae, mse, rmse, r2

# Output (mae, mse, rmse, r2):
# (0.5332001304956565,
#  0.5558915986952444,
#  np.float64(0.7455813830127764),
#  0.5757877060324508)

# Define model directory (a relative path, resolved against the current
# working directory)
model_dir = Path("models/supervised_learning/regression/linear_regression")

# Create the directory and any missing parents; an existing one is left alone
model_dir.mkdir(exist_ok=True, parents=True)

# Save the fitted model together with the fitted scaler
joblib.dump(value=model, filename=model_dir / "linear_regression_model.joblib")
joblib.dump(value=scaler, filename=model_dir / "scaler.joblib")

# Output: ['models\\supervised_learning\\regression\\linear_regression\\scaler.joblib']

# ====================================
# Imports
# ====================================

import numpy as np
import pandas as pd

from sklearn.datasets import fetch_california_housing
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LinearRegression

from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score

from pathlib import Path
import joblib


# ====================================
# Dataset loading
# ====================================

# Fetch the dataset in pandas form and separate features from the target.
data = fetch_california_housing(as_frame=True)
X, y = data.data, data.target


# ====================================
# Train-test split
# ====================================

# 20% of the rows are held out; the seed makes the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)


# ====================================
# Feature scaling
# ====================================

# Fit the scaler on the training rows only, then transform both splits with it.
scaler = StandardScaler()
scaler.fit(X_train)

X_train_scaled = scaler.transform(X_train)
X_test_scaled = scaler.transform(X_test)


# ====================================
# Model initialization
# ====================================

# Estimator with default settings.
lr_model = LinearRegression()


# ====================================
# Model training
# ====================================

# Fit on the scaled training features and the training targets.
lr_model.fit(X=X_train_scaled, y=y_train)


# ====================================
# Predictions
# ====================================

# Predict for the held-out rows, scaled with the same fitted scaler.
y_pred_lr = lr_model.predict(X=X_test_scaled)


# ====================================
# Model evaluation
# ====================================

# Score the test-set predictions: three error measures plus R^2.
mae = mean_absolute_error(y_test, y_pred_lr)
mse = mean_squared_error(y_test, y_pred_lr)
rmse = np.sqrt(mse)  # square root of the mean squared error
r2 = r2_score(y_test, y_pred_lr)

# Report the metrics explicitly. A bare `mae, mse, rmse, r2` expression is
# only displayed when it is the last line of a notebook cell; anywhere else
# its value is discarded and the scores would never be shown.
print(f"MAE:  {mae:.4f}")
print(f"MSE:  {mse:.4f}")
print(f"RMSE: {rmse:.4f}")
print(f"R2:   {r2:.4f}")


# ====================================
# Model persistence
# ====================================

# Target directory for the saved artifacts (relative to the working directory).
model_dir = Path("models/supervised_learning/regression/linear_regression")
model_dir.mkdir(exist_ok=True, parents=True)

# Persist the fitted model and the fitted scaler side by side.
joblib.dump(value=lr_model, filename=model_dir / "linear_regression_model.joblib")
joblib.dump(value=scaler, filename=model_dir / "scaler.joblib")

# LinearRegression parameters (the last value on each line appears to be the setting shown for this model):
# fit_intercept: bool, default=True. Whether to calculate the intercept for this model. If set to False, no intercept will be used in calculations (i.e. data is expected to be centered). Value: True
# copy_X: bool, default=True. If True, X will be copied; else, it may be overwritten. Value: True
# tol: float, default=1e-6. The precision of the solution (`coef_`) is determined by `tol` which specifies a different convergence criterion for the `lsqr` solver. `tol` is set as `atol` and `btol` of :func:`scipy.sparse.linalg.lsqr` when fitting on sparse training data. This parameter has no effect when fitting on dense data. .. versionadded:: 1.7 Value: 1e-06
# n_jobs: int, default=None. The number of jobs to use for the computation. This will only provide speedup in case of sufficiently large problems, that is if firstly `n_targets > 1` and secondly `X` is sparse or if `positive` is set to `True`. ``None`` means 1 unless in a :obj:`joblib.parallel_backend` context. ``-1`` means using all processors. See :term:`Glossary <n_jobs>` for more details. Value: None
# positive: bool, default=False. When set to ``True``, forces the coefficients to be positive. This option is only supported for dense arrays. For a comparison between a linear regression model with positive constraints on the regression coefficients and a linear regression without such constraints, see :ref:`sphx_glr_auto_examples_linear_model_plot_nnls.py`. .. versionadded:: 0.24 Value: False

Supervised Learning -> Linear Regression¶

How this notebook should be read¶

What is Linear Regression?¶

Why we start with intuition¶

What you should expect from the results¶

1. Project setup and common pipeline¶

Why having a common pipeline matters¶

____________________________________¶

2. Dataset loading¶

About the dataset¶

What we obtained¶

____________________________________¶

3. Train-test split¶

Why we split the data¶

What these parameters mean¶

What we have after this step¶

____________________________________¶

4. Feature scaling (why we do it)¶

Why feature scaling is important¶

Does Linear Regression require scaling?¶

Important rule: fit only on training data¶

What we have after this step¶

____________________________________¶

5. What is this model?¶

The core idea¶

Thinking in simple terms¶

From line to prediction¶

____________________________________¶

6. Model training¶

What we have after training¶

____________________________________¶

7. Model parameters interpretation¶

What parameters does Linear Regression learn?¶

How to interpret the coefficients¶

Intercept explained¶

Why parameter interpretation matters¶

Extra:¶

What this plot shows¶

____________________________________¶

8. Predictions¶

What we obtained¶

____________________________________¶

9. Model evaluation¶

Why evaluation is necessary¶

Metrics explanation¶

Mean Absolute Error (MAE)¶

How to interpret the results¶

____________________________________¶

10. When to use it and when not to¶

When Linear Regression is a good choice¶

Typical warning signs¶

____________________________________¶

11. Model persistence¶

Important rule: save the preprocessing too¶

____________________________________¶

12. Mathematical formulation¶

Model equation¶

Objective function¶

Analytical solution in scikit-learn¶

Final takeaway¶

____________________________________¶

Final summary – Code only¶