"""Fit a linear regression of height on weight and print the fitted heights.

The data is read from ``height.csv``, resolved relative to the current
working directory.
"""
from sklearn import linear_model
from pandas import DataFrame
import pandas as pd
import pandas
import matplotlib.pyplot as plt

# header=0 consumes the file's first row as a header line; ``names`` then
# replaces whatever labels that row held with the two names used below.
input_data = pd.read_table(
    "height.csv",
    sep=",",
    header=0,
    names=("weight", "height"),
)

# The scatter plot is only built here; nothing in this script displays it
# (call plt.show() afterwards to view it).
plt.scatter(x=input_data["weight"], y=input_data["height"])

# Keep both sides of the regression as single-column frames rather than
# Series, so the estimator receives two-dimensional inputs.
predictor = DataFrame(input_data, columns=["weight"])
outcome = DataFrame(input_data, columns=["height"])

lm = linear_model.LinearRegression()
lm_model = lm.fit(X=predictor, y=outcome)  # fit() returns the estimator itself

# Predictions are made on the same rows the model was trained on.
predicted_heights = lm.predict(X=predictor)

# Coefficient of determination on the training data; computed for
# inspection but not printed.
r_squared = lm.score(X=predictor, y=outcome)

print(predicted_heights)