diff --git a/outlier_detection.ipynb b/outlier_detection.ipynb new file mode 100644 index 0000000..c92039c --- /dev/null +++ b/outlier_detection.ipynb @@ -0,0 +1,20 @@ +# Outlier Detection Tutorial + +This notebook explains what outliers are and how to detect them using simple methods. + +An outlier is a data point that is very different from other values in a dataset. +Outliers can affect model performance and data analysis. + +import numpy as np +import pandas as pd + +data = pd.DataFrame({ + "values": [10, 12, 13, 14, 15, 100] +}) + +from scipy import stats + +data["z_score"] = stats.zscore(data["values"]) +data + +#Z-score measures how far a value is from the mean.