Spaces:

Sonny4Sonnix
/

Streamlit_app_for_sales_prediction

Sleeping

App Files Files Community

Streamlit_app_for_sales_prediction / src /modelling.py

Sonny4Sonnix

Upload 6 files

f1e0278 over 1 year ago

raw

history blame contribute delete

5.34 kB

	## libraries importation
	##data handling
	import pandas as pd
	import numpy as np
	###encoders and model
	from prophet import Prophet
	from sklearn.preprocessing import LabelEncoder
	from sklearn.preprocessing import OrdinalEncoder
	from category_encoders import BinaryEncoder
	##error metrics
	from sklearn.metrics import mean_absolute_error as MAE
	from sklearn.metrics import mean_squared_log_error as MSLE
	from sklearn.metrics import mean_squared_error as MSE
	from statsmodels.tools.eval_measures import rmse
	##visualization and webapp
	import plotly.express as ex
	import plotly.offline as po
	from prophet.plot import plot_plotly, plot_components_plotly
	import streamlit as st
	import matplotlib.pyplot as plt
	import seaborn as sns

	##model loading
	import joblib

	###importing my dataset

	##our train
	train= pd.read_csv("dataframes/train.csv")
	train= train.drop("Unnamed: 0", axis=1)
	train_target= train[["y"]]

	##getting our test with target

	t_w_target= pd.read_csv("dataframes/test_with_y.csv")

	##filtering out our y

	test= pd.read_csv("dataframes/test.csv")
	test_target= t_w_target[["sales"]]


	##creating a copy of my train

	train_copy= train.copy()


	## data encoding

	##importing my binary encoder
	BE= BinaryEncoder(cols= "holiday")

	##fitting and transforming my train dataset

	train= BE.fit_transform(train.drop("y", axis=1))


	##instantiating and using my ordinal encoder
	##creating a rank
	rank= ["National", "Regional", "Local", "Not Holiday"]
	OE= OrdinalEncoder(categories=[rank])
	train[["locale"]]=OE.fit_transform(train[["locale"]])

	##finally my label encoder
	LE= LabelEncoder()
	##transforming our train
	train["transferred"]=LE.fit_transform(train["transferred"])

	##loading my train set again

	train.head()


	##everything has works so let's fit our model once again

	model=Prophet(yearly_seasonality= True, seasonality_mode= "multiplicative", seasonality_prior_scale=25)

	##stating my exogenous variables (extra regressors)
	exo_cols=[ 'holiday_0', 'holiday_1', 'holiday_2', 'locale', 'transferred', 'onpromotion', 'transactions']

	for cols in exo_cols:
	model.add_regressor(cols, standardize=True)

	##concating my train features with my train target to allow me fit

	full_train= pd.merge(left= train, right= train_target,left_index=True, right_index=True)

	full_train

	##fitting out data on the full train
	model.fit(full_train)


	##let's make a prediction on our test

	###before that I will make a copy of my test sample

	test_features= test.copy()

	test_features= test_features.drop("Unnamed: 0", axis= 1)

	test_features
	##rename the date column

	test_features= test_features.rename(columns= {"date": "ds"})

	##using my binary encoder to transform it
	##transforming my test
	test_features[["locale"]]= OE.transform(test_features[["locale"]])

	test_features["transferred"]= LE.transform(test_features["transferred"])
	test_features= BE.transform(test_features)

	test_features
	##making predictions on my test data

	eval_fbp= model.predict(test_features)

	##filtering out my yhat to let me calculate my error metrics
	eval= eval_fbp[["yhat"]]

	##error metrics
	## i will be evaluating the model's performance using MAE, MSE, and RMSLE

	mean_abs_err= (MAE(eval,test_target)/test_target.mean())*100

	rmsle= np.sqrt(MSLE(eval,test_target))

	rmse=np.sqrt(MSE(eval,test_target))

	rmsle
	mean_abs_err
	rmse
	###Our model is working well, so we will go ahead and dump the various components
	final_results= pd.DataFrame({"MAE":mean_abs_err, "RMSLE": rmsle, "RMSE":rmse })
	final_results

	##plotting my outcome
	model.plot(eval_fbp)
	plt.show()

	### I am going to drop my prophet and thhen


	"""in this section, I am going to drop the holidays column and then use the inbuilt Facebook Prophet Holiday
	feature
	"""
	##loading my dataframes again

	##dropping the holiday columns for the new training dataframe
	train_2= train_copy.drop(columns= ["holiday", "locale", "transferred"], axis= 1)

	train_2
	##dropping the holiday columns for the new test dataframe

	test_2= test.drop(columns= ["Unnamed: 0","holiday", "locale", "transferred"], axis= 1)

	test_2

	train_2

	##instatiating my model

	model_2= Prophet(yearly_seasonality= True,
	seasonality_mode= "multiplicative", seasonality_prior_scale=25)

	##adding the holiday effect
	model_2.add_country_holidays(country_name= "ECU")

	##adding my regressors (exogenous variables)

	for col in train_2.drop(columns=["ds", "y"], axis= 1):
	model_2.add_regressor(col, standardize=True, prior_scale=20)


	model_2.fit(train_2)

	eval_2_fbp=model_2.predict(test_2)

	##getting my predicted values

	eval_2= eval_2_fbp[["yhat"]]

	##evaluating my model's performance

	mae_2= (MAE(test_target,eval_2)/test_target.mean()) * 100

	rmsle_2= np.sqrt(MSLE(test_target,eval_2))

	rmse_2= np.sqrt(MSE(test_target,eval_2))

	final_error_2= pd.DataFrame({"MAE":mae_2, "RMSLE": rmsle_2, "RMSE":rmse_2 })

	final_error_2

	final_results

	model_2.plot_components(eval_2_fbp)
	model_2.plot(eval_2_fbp)
	plt.show()

	""" our second model with embedded holiday effects did pretty well by giving us a much lower rmsle than our
	initial model where we used had to hard-encode our holiday effect
	"""
	##saving my Facebook Prophet model
	#joblib.dump(model_2,"Z:/Users/Sonny Otchi/Desktop/models/fbpmodel.joblib")

	"""
	Note: Since we used facebook prophet's inbuilt holiday effect, we will not need to save any of the encoders
	"""