From d3ae31873d6e9296dc8d75819a737dfdf4468bad Mon Sep 17 00:00:00 2001
From: amilashanaka <dsa.amilashanaka@gmail.com>
Date: Tue, 29 Nov 2022 03:18:09 +0000
Subject: [PATCH] prepare data set, change dataset appearance

---
 model.py | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)

diff --git a/model.py b/model.py
index 738ca0d..b9079bd 100644
--- a/model.py
+++ b/model.py
@@ -16,6 +16,8 @@ from keras.layers import Dense, LSTM, Dropout
 import warnings
 warnings.filterwarnings("ignore")
 
+from datetime import datetime as dt
+
 data = pd.read_csv("data/product__demnd.csv")
 
 print(data)
@@ -31,3 +33,28 @@ data.dropna(inplace=True)
 
 print(data.isnull().sum())
 
+# Parse 'Date' before sorting so rows are ordered chronologically rather
+# than lexicographically by their string form.
+data['Date'] = pd.to_datetime(data['Date'])
+data.sort_values('Date', ignore_index=True, inplace=True)
+print(data.head())
+
+# Strip the literal parentheses wrapped around some 'OrderDemand' values.
+# regex=False makes '(' and ')' plain characters instead of regex syntax.
+# NOTE(review): parentheses often denote negative amounts; the sign is
+# dropped here, as in the original change -- confirm this is intended.
+data['OrderDemand'] = data['OrderDemand'].str.replace('(', "", regex=False)
+data['OrderDemand'] = data['OrderDemand'].str.replace(')', "", regex=False)
+
+data['OrderDemand'] = data['OrderDemand'].astype('int64')
+
+# Create Year, Month, Day columns from the parsed dates.
+data['Year'] = data["Date"].dt.year
+data['Month'] = data["Date"].dt.month
+data['Day'] = data["Date"].dt.day
+
+# Summary information about the data. DataFrame.info() prints its report
+# itself and returns None, so it is not wrapped in print().
+data.info()
+
+print(data["OrderDemand"].describe())
\ No newline at end of file
-- 
GitLab