# Linear Regression.ipynb - Colab
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.datasets import load_diabetes
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score
# Plot residuals
def plot_residuals(y_test, y_pred):
    """Plot the distribution of the residuals ``y_test - y_pred``.

    Opens a new 10x6 figure, draws a histogram of the residuals with a
    KDE overlay, labels the axes and title, and shows the figure.

    Args:
        y_test: Observed target values (any array-like).
        y_pred: Predicted values, same length as ``y_test`` (any array-like).
    """
    # Coerce to arrays so the subtraction is positional: plain lists work,
    # and two pandas Series with different indexes are not label-aligned
    # into NaNs.
    residuals = np.asarray(y_test) - np.asarray(y_pred)

    plt.figure(figsize=(10, 6))
    sns.histplot(residuals, kde=True)
    plt.xlabel('Residuals')
    plt.ylabel('Frequency')
    plt.title('Residuals Distribution')
    plt.show()
# Main workflow
def main():
    """Run the workflow: load data, split, fit, predict, and plot.

    Relies on ``load_data``, ``prepare_data``, ``plot_feature_distributions``
    and ``plot_actual_vs_predicted``, which are not visible in this part of
    the file and are assumed to be defined elsewhere in it.
    """
    # Load and prepare data
    data = load_data()
    X_train, X_test, y_train, y_test = prepare_data(data)

    # Fit the model and predict on the held-out split. The plotting calls
    # below need y_pred, which was previously never assigned (NameError).
    model = LinearRegression()
    model.fit(X_train, y_train)
    y_pred = model.predict(X_test)

    # Plot visualizations
    plot_feature_distributions(data)
    plot_actual_vs_predicted(y_test, y_pred)
    plot_residuals(y_test, y_pred)
https://colab.research.google.com/drive/1D79M0mc1VqFBI-BSWQk8leEX87LjbAmI#printMode=true 2/3
7/30/24, 3:55 PM Untitled4.ipynb - Colab
s4 s5 s6 target
0 -0.002592 0.019907 -0.017646 151.0
1 -0.039493 -0.068332 -0.092204 75.0
2 -0.002592 0.002861 -0.025930 141.0
3 0.034309 0.022688 -0.009362 206.0
4 -0.002592 -0.031988 -0.046641 135.0
https://colab.research.google.com/drive/1D79M0mc1VqFBI-BSWQk8leEX87LjbAmI#printMode=true 3/3