JEENB
diff --git a/‎__pycache__/models.cpython-39.pyc
-2.74 KB b/‎__pycache__/models.cpython-39.pyc
-2.74 KB
diff --git a/‎models.py
Lines changed: 13 additions & 11 deletions b/‎models.py
Lines changed: 13 additions & 11 deletions
diff --git a/‎received.csv
Lines changed: 1 addition & 0 deletions b/‎received.csv
Lines changed: 1 addition & 0 deletions
diff --git a/‎report/2.png
945 KB b/‎report/2.png
945 KB
diff --git a/‎report/create_report.py
Lines changed: 36 additions & 2 deletions b/‎report/create_report.py
Lines changed: 36 additions & 2 deletions
diff --git a/‎server_data/actual_pred.png
2.25 KB b/‎server_data/actual_pred.png
2.25 KB
diff --git a/‎server_data/compare_error.png
-548 Bytes b/‎server_data/compare_error.png
-548 Bytes
diff --git a/‎server_data/fitting.png
162 Bytes b/‎server_data/fitting.png
162 Bytes
diff --git a/‎server_data/normalqq.png
19.9 KB b/‎server_data/normalqq.png
19.9 KB
diff --git a/‎server_data/report.pdf
808 KB b/‎server_data/report.pdf
808 KB
@@ -72,7 +72,7 @@ def reg_training_model(df, degree = 1, split_ratio = 0.2, email ="dummy"):
 
 
 	##-------------------------------------------------
-	#---------- Accuracy vs Predicted -----------------
+	#---------- Actual vs Predicted -----------------
 	##-------------------------------------------------
 
 	# x axis = actual 
@@ -86,11 +86,12 @@ def reg_training_model(df, degree = 1, split_ratio = 0.2, email ="dummy"):
 	y_= min(min(y_test), min(y_test_pred), min(y_train), min(y_train_pred))
 	x = np.linspace(y_,y,1000)
 	plt.plot(x,x, color = "g")
-
+	plt.xlabel("Actual Results")
+	plt.ylabel("Predicted Results")
 	plt.legend(loc='upper left')	
 	plt.title("Actual VS Predicted")
 	plt.savefig("server_data/actual_pred.png")
-	plt.show()
+
 
 
 	##------------------------------------
@@ -102,7 +103,7 @@ def reg_training_model(df, degree = 1, split_ratio = 0.2, email ="dummy"):
 	plt.ylabel("Mean Square Error")
 	plt.title("Comparing Errors")
 	plt.savefig("server_data/compare_error.png")
-	plt.show()
+
 
 
 	##-------------------------------------------------
@@ -119,20 +120,21 @@ def reg_training_model(df, degree = 1, split_ratio = 0.2, email ="dummy"):
 	plt.legend(loc='upper left')	
 	plt.title("Residual VS Predicted")
 	plt.savefig("server_data/residual_pred.png")
-	plt.show()
+
 
 
 
 	##-------------------------------------------------
 	#---------- Normal Q- Q----------------------------
 	##-------------------------------------------------
-	fig, (ax1, ax2) = plt.subplot(1,2, figsize=(10,6))
+	fig, (ax1, ax2) = plt.subplots(1,2, figsize=(10,6))
 	fig.suptitle('Normal Q-Q')
-	ax1 = sm.qqplot(residual_train, line='45', color ='b')
+	sm.qqplot(residual_train, line='45',  ax = ax1)
 	ax1.set_title("Train")
-	ax2 = sm.qqplot(residual_test, line='45', color = 'r')
-	plt.show()
-	
-
+	ax1.set_ylabel("Standard Residual")
+	sm.qqplot(residual_test, line='45',  ax = ax2)
+	ax2.set_title("Test")
+	ax2.set_ylabel("Standard Residual")
+	plt.savefig("server_data/residual_pred.png")
 	return 0
 
@@ -99,3 +99,4 @@ x,y
 50.039575939875988,85.232007342325673
 48.149858891028863,66.224957888054632
 25.128484647772304,53.454394214850524
+22.23, 21.23
@@ -66,12 +66,46 @@ def create_report():
 	section("Results")
 
 	section("1. Polynomial Fitting")
-	pdf.image("neworignial.jpeg",50,140,w=120, h = 72)
+	pdf.image("./server_data/fitting.png",50,140,w=120, h = 72)
 	pdf.ln(84)
 	multi_line("The above figure represents the regression line being fitted to the training instances. If the regression line passes through all the points then the polynomial degree chosen overfits the data. Similarly, if the line does not touch even a single point, you might be underfitting the training instances.")
 
-
+	pdf.add_page()
+	section("2. Actual vs Predicted")
+	pdf.image("./server_data/actual_pred.png",50,20,w=120, h = 72)
+	pdf.ln(84)
+	multi_line("The above scatter plot represents the spread of predicted and actual scores. Assuming our model perfectly fits the data, we can expect the points to lie along the y = x line.")
+	line("")
 
+
+	section("3. Residual vs Predicted")
+	pdf.image("./server_data/actual_pred.png",50,140,w=120, h = 72)
+	pdf.ln(84)
+	line("Residual = h(x) - f(x)")
+	line("where,")
+	line("h(x) is the predicted value and f(x) is the actual value")
+	line("")
+	multi_line("The fitted vs residuals plot is mainly useful for investigating: Whether linearity holds. This is indicated by the mean residual value for every fitted value region being close to 0. In R this is indicated by the red line being close to the dashed line. Whether homoskedasticity holds. The spread of residuals should be approximately the same across the x-axis. Whether there are outliers. This is indicated by some extreme residuals that are far from the rest.")
+
+
+	pdf.add_page()
+	section("4. Mean Squared Error")
+	pdf.image("./server_data/compare_error.png",50,20,w=120, h = 72)
+	pdf.ln(80)
+	multi_line("The mean squared error is calculated as the average of the squared differences between the actual and predicted results. The lower the MSE, the better the model performs.")
+	line("")
+
+	section("5. Normal Q-Q Plots")
+	pdf.image("./server_data/normalqq.png",50,125,w=120, h = 72)
+	pdf.ln(75)
+	line("")
+	multi_line("The Q-Q plot, or quantile-quantile plot, is a graphical tool to help us assess if a set of data plausibly came from some theoretical distribution such as a Normal or exponential. For example, if we run a statistical analysis that assumes our dependent variable is Normally distributed, we can use a Normal Q-Q plot to check that assumption. It's just a visual check, not an air-tight proof, so it is somewhat subjective. But it allows us to see at-a-glance if our assumption is plausible, and if not, how the assumption is violated and what data points contribute to the violation.")
+	line('')
+	multi_line("A Q-Q plot is a scatterplot created by plotting two sets of quantiles against one another. If both sets of quantiles came from the same distribution, we should see the points forming a line that's roughly straight. Here's an example of a Normal Q-Q plot when both sets of quantiles truly come from Normal distributions.")
+
+	pdf.add_page()
+	pdf.image("./report/2.png",0,0,width)
+
 	pdf.output("./server_data/report.pdf", 'F')