From c401479e0a131f6f66e91db3c9f7ccca3796d289 Mon Sep 17 00:00:00 2001
From: amilashanaka <dsa.amilashanaka@gmail.com>
Date: Tue, 29 Nov 2022 03:34:27 +0000
Subject: [PATCH] Product Category - Data Frequency

---
 model.py | 14 +++++++++++++-
 1 file changed, 13 insertions(+), 1 deletion(-)

diff --git a/model.py b/model.py
index b9079bd..47326fc 100644
--- a/model.py
+++ b/model.py
@@ -55,4 +55,16 @@ data['Day'] = data["Date"].dt.day
 
 # information about data
 print(data.info())
-print(data["OrderDemand"].describe())
\ No newline at end of file
+print(data["OrderDemand"].describe())
+
+# information about categorical variables
+print(data[["ProductCode", "Warehouse", "ProductCategory"]].describe())
+
+# Number of samples according to ProductCategory
+plt.figure()
+plt.barh(data["ProductCategory"].value_counts().index, data["ProductCategory"].value_counts(), color = "b")
+plt.xlabel("Frequency")
+plt.ylabel("Product Category")
+plt.title("Product Category - Data Frequency")
+plt.show()
+print(f"Number of ProductCategory \n{data['ProductCategory'].value_counts()}")
-- 
GitLab