# Packages used
import numpy
from matplotlib import pyplot as pl
from sklearn.linear_model import LinearRegression
import pandas

# Load the data set; "dat.csv" is resolved relative to the current working directory.
dat = pandas.read_csv("dat.csv")

# Response variable: the "Actual duration" column as an (n, 1) column vector.
# NOTE(review): the previous comment called this the "actual effort (minimum cost
# to be met to avoid overscoping)" -- confirm that this column is the intended one.
e = dat["Actual duration"].to_numpy().reshape(-1, 1)

# Predictor variable: the "Team size" column as an (n, 1) column vector
# (scikit-learn expects a 2-D feature matrix).
s = dat["Team size"].to_numpy().reshape(-1, 1)

# Fit a least-squares line of duration against team size; fit() returns the
# estimator itself, so construction and fitting are chained.
lr = LinearRegression().fit(s, e)

# Evaluate the fitted model at the observed team sizes to get the line of best fit.
lobf = lr.predict(s)

# Draw the raw observations, overlay the fitted line in red, then display the figure.
pl.scatter(s, e)
pl.plot(s, lobf, color="red")
pl.show()
