I am following the process shown on Wine Quality Prediction End-to-End ML Project on Krish Naik's YouTube channel to do a Flight Fare Prediction Project.
I run this cell of model trainer pipeline on 04_model_trainer.ipynb:
try:
    config = ConfigurationManager()
    model_trainer_config = config.get_model_trainer_config()
    model_trainer_config = ModelTrainer(model_trainer_config)
    # model_trainer_config.train()
    model_trainer_config.initiate_model_training()
except Exception as e:
    raise e
I get this error:
TypeError: initiate_model_training() missing 4 required positional arguments: 'X_train', 'X_test', 'y_train', and 'y_test'
Here is the full traceback:
[2023-12-16 21:58:22,484: INFO: common: yaml file: config\config.yaml loaded successfully]
[2023-12-16 21:58:22,493: INFO: common: yaml file: params.yaml loaded successfully]
[2023-12-16 21:58:22,493: INFO: common: yaml file: schema.yaml loaded successfully]
[2023-12-16 21:58:22,493: INFO: common: created directory at: artifacts]
[2023-12-16 21:58:22,493: INFO: common: created directory at: artifacts/model_trainer]
---------------------------------------------------------------------------
TypeError                                 Traceback (most recent call last)
Cell In[25], line 8
      6     model_trainer_config.initiate_model_training()
      7 except Exception as e:
----> 8     raise e
Cell In[25], line 6
      4     model_trainer_config = ModelTrainer(model_trainer_config)
      5     # model_trainer_config.train()
----> 6     model_trainer_config.initiate_model_training()
      7 except Exception as e:
      8     raise e
TypeError: initiate_model_training() missing 4 required positional arguments: 'X_train', 'X_test', 'y_train', and 'y_test'
Here is the code of ModelTrainer class:
class ModelTrainer:
    def __init__(self, model_trainer_config):
        self.model_trainer_config = model_trainer_config  
    # def __init__(self):
        # self.model_trainer_config = ModelTrainerConfig()    
    def save_obj(file_path, obj):
        try:
            dir_path = os.path.dirname(file_path)
            os.makedirs(dir_path, exist_ok=True)
            with open(file_path, 'wb') as file_obj:
                joblib.dump(obj, file_obj, compress= ('gzip'))
        except Exception as e:
            logger.info('Error occured in utils save_obj')
            raise e
        
    def evaluate_model(X_train, y_train, X_test, y_test, models):
        try:
            report = {}
            for i in range(len(models)):
                model = list(models.values())[i]
                # Train model
                model.fit(X_train,y_train)
                # Predict Testing data
                y_test_pred = model.predict(X_test)
                # Get R2 scores for train and test data
                test_model_score = r2_score(y_test,y_test_pred)
                report[list(models.keys())[i]] =  test_model_score
            return report
        except Exception as e:
            logger.info('Exception occured during model training')
            raise e    
    def initiate_model_training(self, X_train, X_test, y_train, y_test):
        try:
            logger.info('Splitting ')
            models={
            'LinearRegression':LinearRegression(),
            'Lasso':Lasso(),
            'Ridge':Ridge(),
            'Elasticnet':ElasticNet(),
            'RandomForestRegressor': RandomForestRegressor(),
            'GradientBoostRegressor()' : GradientBoostingRegressor(),
            "AdaBoost" : AdaBoostRegressor(),
            'DecisionTreeRegressor' : DecisionTreeRegressor(),
            "SupportVectorRegressor" : SVR(),
            "KNN" : KNeighborsRegressor()
            }
            model_report:dict = ModelTrainer.evaluate_model(X_train,y_train, X_test, y_test, models)
            print(model_report)
            print("\n====================================================================================")
            logger.info(f'Model Report : {model_report}')
            # to get best model score from dictionary
            best_model_score = max(sorted(model_report.values()))
            best_model_name = list(model_report.keys())[
                list(model_report.values()).index(best_model_score)
            ]
            best_model = models[best_model_name]
            print(f"Best Model Found, Model Name :{best_model_name}, R2-score: {best_model_score}")
            print("\n====================================================================================")
            logger.info(f"Best Model Found, Model name: {best_model_name}, R2-score: {best_model_score}")
            logger.info(f"{best_model.feature_names_in_}")
            
            ModelTrainer.save_obj(
            file_path = self.model_trainer_config.trained_model_file_path,
            obj = best_model
            )
        except Exception as e:
            logger.info('Exception occured at model trianing')
            raise e
Here is my file in GitHub.
My file encoding is UTF-8
Would you please help me to fix this issue?
 
                        
So based on the logic that you have in your jupyter notebook, you should likely have
initial_model_training()modified to look like the below function:you should look through and understand how these https://drive.google.com/file/d/1c7k8i1l2X_r9i4yWAkQzxiP1Nu8_wqap/view these files work (from the tutorial that you are following), before you start to modify the code.