01: remove outliers from data
This commit is contained in:
parent
47164f81d4
commit
0f655c8719
|
@ -20,10 +20,9 @@ import seaborn as sns
|
|||
|
||||
# %% Data
|
||||
data = pd.read_csv("../data/melb_data.csv").dropna()
|
||||
# One troublesome outlier
|
||||
# TODO: remove outlier from actual data, not just diagram
|
||||
data = data[(data["BuildingArea"] < 1000) ]
|
||||
ax = sns.scatterplot(x=data['BuildingArea'], y=data['Price'])
|
||||
ax.set(xlim=(0, 1000))
|
||||
# ax.set(xlim=(0, 1000)) # no longer needed once the outliers are removed from the data itself
|
||||
|
||||
|
||||
# %% linear regression
|
||||
|
|
Loading…
Reference in New Issue