Õunte andmed võeti veebiaadressilt
Anomaaliad püüti leida meetoditega
from azureml import Workspace
# Open the Azure ML workspace. Workspace() is called without arguments, so
# the connection settings are presumably supplied by the environment
# (TODO confirm).
ws = Workspace()

# Look the experiment up by its id, then fetch the CSV written to the
# 'Results dataset' output port of one specific node in that experiment.
experiment_id = '66e373b2084d4ffa9395c0e34ce9ccaa.f-id.e773e947bd7d4c68b4da26e992d0122f'
experiment = ws.experiments[experiment_id]
ds = experiment.get_intermediate_dataset(
    node_id='ebd1c86f-2ee7-47f3-b8d9-428740f5e5d8-36086',
    port_name='Results dataset',
    data_type_id='GenericCSV',
)

# Convert the dataset to a data frame and peek at its first and last rows
# (the bare expressions only display anything in an interactive session).
frame = ds.to_dataframe()
frame.head()
frame.tail()
import matplotlib.pyplot as plt
# First look at the data: August values against September values.
plt.scatter(frame["august"], frame["september"])
plt.show()

# Same scatter, with each point coloured by its Label value and drawn
# without a marker outline.
plt.scatter(
    frame["august"],
    frame["september"],
    c=frame["Label"],
    edgecolors="none",
)
plt.show()
# Inspect the raw scores and their mean (only displayed in an interactive
# session).
frame["Scored Probabilities"]
frame["Scored Probabilities"].mean()

# Min-max normalise the scores.
tulp = frame["Scored Probabilities"]
score_min = tulp.min()
score_range = tulp.max() - score_min
# Store the result as a real column: assigning through attribute syntax
# (frame.normskoor = ...) would only set a Python attribute on the object,
# which pandas warns about and which is lost on any copy or filter.
# When every score is identical the range is 0; use 0.0 instead of dividing
# by zero so the marker sizes below stay finite.
frame["normskoor"] = (tulp - score_min) / score_range if score_range else 0.0
frame.normskoor.max()

# Scatter coloured by Label, with marker area growing with the normalised
# score (0.5 is the minimum size so the lowest-scored point stays visible).
plt.scatter(
    frame.august,
    frame.september,
    c=frame.Label,
    s=frame.normskoor * 20 + 0.5,
    edgecolors="none",
)
plt.show()
# Keep only the rows whose Label equals 1, and only the two month columns.
tavalised = frame.loc[frame.Label == 1, ["august", "september"]]

plt.scatter(tavalised.august, tavalised.september, edgecolor="none")
plt.title("Õunte suurused (cm)")
plt.xlabel("august")
plt.ylabel("september")
plt.xlim([0, 10])
plt.ylim([0, 10])

# Shared look for the two thin dotted guide lines.
guide_style = dict(linewidth=0.6, linestyle="dotted", color="gray")
august_mean = tavalised.august.mean()
september_mean = tavalised.september.mean()

# Vertical line at the August mean, from 0 up to the largest September value.
plt.plot(
    [august_mean, august_mean],
    [0, tavalised.september.max()],
    **guide_style
)
# Horizontal line at the September mean, from 0 out to the largest August
# value.
plt.plot(
    [0, tavalised.august.max()],
    [september_mean, september_mean],
    **guide_style
)
plt.show()