
Simulating and Predicting Conversion Efficiency in Cs₂CuBiCl₆-Based Perovskite Cells: A Machine Learning Approach
Nikhil Shrivastav, Jaya Madan and Rahul Pandey*

VLSI Centre of Excellence, Chitkara University Institute of Engineering and Technology, Chitkara University,
Punjab, India
*Corresponding author

[email protected] and [email protected]

Contents
Random Forest
XGBoost

Random Forest-

import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
import keras_tuner as kt
import shap
from sklearn.model_selection import train_test_split, GridSearchCV, cross_val_score
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score
from sklearn.preprocessing import StandardScaler
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Dropout
from tensorflow.keras.callbacks import EarlyStopping
# Import the RandomSearch tuner from keras_tuner
from keras_tuner.tuners import RandomSearch

# Read the input dataset
df = pd.read_csv('/content/drive/MyDrive/ML/Nikhil_ML3.csv')
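A note on the input data (added for context): the Drive CSV is assumed to contain the columns 'Thickness', 'doping', and 'Defect' plus a PCE target column, which the lines below rely on. Readers without access to that file could substitute a hypothetical stand-in with the same layout, for example:

# Hypothetical stand-in data (illustrative values only, not the simulation results used in the paper)
df = pd.DataFrame({
    'Thickness': np.random.uniform(0.1, 1.0, 200),
    'doping': np.random.uniform(1e14, 1e18, 200),
    'Defect': np.random.uniform(1e13, 1e16, 200),
    'PCE (%)': np.random.uniform(5, 20, 200),
})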
# Split data into features and target variable
X = df[['Thickness', 'doping', 'Defect']]
y = df['PCE (%)']
# Splitting the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
# Creating the RandomForestRegressor model
rf_model = RandomForestRegressor()
# Defining the hyperparameters to search
params = {
    'max_depth': [3, 5, 7],
    'n_estimators': [50, 100, 200],
    'min_samples_leaf': [1, 3, 5]
}
# Performing GridSearchCV to find the best hyperparameters
grid_search = GridSearchCV(estimator=rf_model, param_grid=params, cv=3, n_jobs=-1)
grid_search.fit(X_train, y_train)
# Getting the best hyperparameters
best_params = grid_search.best_params_
print("Best Hyperparameters:", best_params)
# Creating the final RandomForestRegressor model with the best hyperparameters
final_rf_model = RandomForestRegressor(**best_params)
# Training the model
final_rf_model.fit(X_train, y_train)
# Predicting the target variable on the test set
y_test_pred = final_rf_model.predict(X_test)
# Calculating evaluation metrics (MSE, R-squared, cross-validation score)
mse = mean_squared_error(y_test, y_test_pred)
r2 = r2_score(y_test, y_test_pred)
cv_score = cross_val_score(grid_search.best_estimator_, X, y, cv=50)
print('Mean Squared Error:', mse)
print('R-squared:', r2)
print('Cross-Validation Score:', cv_score.mean())
print('Best Parameters:', grid_search.best_params_)
print('Best Score:', grid_search.best_score_)

Output
Best Hyperparameters: {'max_depth': 7, 'min_samples_leaf': 1, 'n_estimators': 100}
Mean Squared Error: 0.05262326227246941
R-squared: 0.9897033432799267
Cross-Validation Score: -5256.733933041297
Best Parameters: {'max_depth': 7, 'min_samples_leaf': 1, 'n_estimators': 100}
Best Score: 0.9914386927829856
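The cross-validation score above is strongly negative even though the held-out R-squared is high. A plausible explanation (an interpretation added here, not stated in the original) is that cross_val_score defaults to the regressor's R-squared score and to unshuffled folds, so cv=50 on an ordered dataset forces many folds to extrapolate, which can drive R-squared far below zero. A shuffled KFold is one way to probe this:

# Added sketch: repeat the cross-validation with shuffled folds
from sklearn.model_selection import KFold
cv = KFold(n_splits=5, shuffle=True, random_state=42)
cv_score_shuffled = cross_val_score(grid_search.best_estimator_, X, y, cv=cv, scoring='r2')
print('Shuffled 5-fold CV R2:', cv_score_shuffled.mean())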

Explaining the model's predictions using SHAP values


explainer = shap.TreeExplainer(final_rf_model)
shap_values = explainer.shap_values(X)

# Creating a SHAP summary plot to show the impact of all features,
# then saving it (summary_plot must run before savefig, otherwise an empty figure is saved)
shap.summary_plot(shap_values, X, show=False)
plt.savefig('18042023RF_PCE_SHAP values.png', dpi=600)
plt.show()
# Predict on the training set (test-set predictions were computed above)
y_train_pred = final_rf_model.predict(X_train)

# Calculate the x-axis range for the plot


xmin = min(min(y_train_pred), min(y_test_pred))
xmax = max(max(y_train_pred), max(y_test_pred))

# Plotting actual PCE vs predicted PCE for the training set and test set
plt.scatter(y_train, y_train_pred, c='blue', label='Training set')
plt.scatter(y_test, y_test_pred, c='red', label='Test set')
plt.plot(np.linspace(xmin, xmax, 100), np.linspace(xmin, xmax, 100), '--', label='Perfect fit')
plt.xlabel('Actual PCE')
plt.ylabel('Predicted PCE')
plt.title('RF Actual vs Predicted | PCE')
plt.legend()
plt.savefig('10082023RF_PCE_Actual vs predicted.png', dpi=600)
plt.show()
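mean_absolute_error is imported above but not used in the listing; as a small optional check (an addition, not part of the original script), the training- and test-set MAE can be compared to gauge overfitting:

# Added check: compare train/test mean absolute error
train_mae = mean_absolute_error(y_train, y_train_pred)
test_mae = mean_absolute_error(y_test, y_test_pred)
print('Training MAE:', train_mae)
print('Test MAE:', test_mae)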

XGBoost-

import pandas as pd
import numpy as np
import xgboost as xgb
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split, GridSearchCV, cross_val_score
from sklearn.metrics import mean_squared_error, r2_score
from xgboost import XGBRegressor

# Defining the hyperparameters to search
params = {
    'learning_rate': [0.1, 0.3, 0.5],
    'max_depth': [3, 5, 7],
    'n_estimators': [50, 100, 200],
    'min_child_weight': [1, 3, 5]
}

# Read the CSV file
csv_file_path = '/content/drive/MyDrive/ML/Nikhil_ML3.csv'
df = pd.read_csv(csv_file_path)

# Assume the last column is the target variable and the rest are features
X = df.iloc[:, :-1]
y = df.iloc[:, -1]

# Split the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Creating the XGBRegressor model
xgb_model = xgb.XGBRegressor()

# Performing GridSearchCV to find the best hyperparameters
grid_search = GridSearchCV(estimator=xgb_model, param_grid=params, cv=3, n_jobs=-1)
grid_search.fit(X_train, y_train)
grid_search.fit(X_train, y_train)

best_params = grid_search.best_params_
print("Best Hyperparameters:", best_params)
# Creating the final XGBRegressor model with the best hyperparameters
final_xgb_model = xgb.XGBRegressor(**best_params)
# Training the model
final_xgb_model.fit(X_train, y_train)
# Predicting the target variable on the test set
y_test_pred = final_xgb_model.predict(X_test)
# Predict on training and test sets
y_train_pred = final_xgb_model.predict(X_train)
# Calculating evaluation metrics (MSE, R-squared, cross-validation score)
mse = mean_squared_error(y_test, y_test_pred)
r2 = r2_score(y_test, y_test_pred)
cv_score = cross_val_score(grid_search.best_estimator_, X, y, cv=50)
print('Mean Squared Error:', mse)
print('R-squared:', r2)
print('Cross-Validation Score:', cv_score.mean())
print('Best Parameters:', grid_search.best_params_)
print('Best Score:', grid_search.best_score_)

Output
Best Hyperparameters: {'learning_rate': 0.1, 'max_depth': 7, 'min_child_weight': 1, 'n_estimators': 200}
Mean Squared Error: 0.0014407104963233793
R-squared: 0.9997180999281869
Cross-Validation Score: -4718.083636367358
Best Parameters: {'learning_rate': 0.1, 'max_depth': 7, 'min_child_weight': 1, 'n_estimators': 200}
Best Score: 0.9998299680327589

# Visualizing the first tree in the trained model


fig, ax = plt.subplots(figsize=(30, 20), dpi=600)
xgb.plot_tree(final_xgb_model, num_trees=0, ax=ax)
plt.savefig('/content/drive/MyDrive/ML/Nikhil_ML3.csv_PCE_tree in the trained model.png', dpi=600)
plt.show()
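As a complementary, added view of the fitted booster (not part of the original listing), XGBoost's built-in importance plot can summarize how much each feature contributes to the splits:

# Added sketch: gain-based feature importance for the tuned model
fig, ax = plt.subplots(figsize=(6, 4))
xgb.plot_importance(final_xgb_model, importance_type='gain', ax=ax)
plt.tight_layout()
plt.show()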

import shap
explainer = shap.TreeExplainer(final_xgb_model)
shap_values = explainer.shap_values(X)
# Creating a SHAP summary plot to show the impact of all features,
# then saving it (summary_plot must run before savefig, otherwise an empty figure is saved)
shap.summary_plot(shap_values, X, show=False)
plt.savefig('20052023XGB_AgBiSCl2NK_PCE_SHAP values.png', dpi=600)
plt.show()
# Calculate the x-axis range for the plot
xmin = min(min(y_train_pred), min(y_test_pred))
xmax = max(max(y_train_pred), max(y_test_pred))
# Plotting actual PCE vs predicted PCE for the training set and test set
plt.scatter(y_train, y_train_pred, c='blue', label='Training set')
plt.scatter(y_test, y_test_pred, c='red', label='Test set')
plt.plot(np.linspace(xmin, xmax, 100), np.linspace(xmin, xmax, 100), '--', label='Perfect fit')
plt.xlabel('Actual PCE')
plt.ylabel('Predicted PCE')
plt.title('Actual vs Predicted | PCE | AgBiSCl2NK')
plt.legend()
plt.savefig('20052023XGB_AgBiSCl2NK_PCE_Actual vs predicted.png', dpi=600)
plt.show()
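If the tuned model needs to be reused outside the notebook (an added suggestion, not part of the original listing; the file name below is hypothetical), XGBoost's native save/load format is one option:

# Added sketch: persist and reload the tuned model (hypothetical file name)
final_xgb_model.save_model('xgb_pce_model.json')
reloaded = xgb.XGBRegressor()
reloaded.load_model('xgb_pce_model.json')
print('Reloaded-model R2 on test set:', r2_score(y_test, reloaded.predict(X_test)))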
