AI-Supply-chain-Beta / utils /preprocessing.py
Callmebowoo-22's picture
Update utils/preprocessing.py
581242d verified
raw
history blame contribute delete
464 Bytes
import pandas as pd
from sklearn.ensemble import IsolationForest
def clean_data(file, *, contamination=0.05, random_state=42):
    """Load a CSV, sort it by date, and drop the rows flagged as anomalies.

    The CSV must contain a ``tanggal`` column that ``pandas.to_datetime``
    can parse, plus ``demand`` and ``supply`` columns, which are the two
    features handed to the IsolationForest model.

    Args:
        file: Anything ``pandas.read_csv`` accepts as its first argument.
        contamination: Forwarded to ``IsolationForest``. Defaults to 0.05,
            the value that used to be hard-coded here.
        random_state: Forwarded to ``IsolationForest``. Defaults to 42,
            the value that used to be hard-coded here.

    Returns:
        A DataFrame sorted by ``tanggal`` that keeps only the rows labelled
        ``1`` by ``fit_predict``. The index is reset after sorting but not
        after filtering, so gaps in the index mark removed rows. If the
        input has no data rows, the empty formatted frame is returned.

    Raises:
        KeyError: If ``tanggal``, ``demand`` or ``supply`` is missing.
    """
    # Read and format the data.
    df = pd.read_csv(file)
    df['tanggal'] = pd.to_datetime(df['tanggal'])
    df = df.sort_values('tanggal').reset_index(drop=True)

    # Select the features before the empty check so that a missing column
    # still fails loudly even when the file has no data rows.
    features = df[['demand', 'supply']]

    # The model cannot be fitted on zero samples, and with no rows there is
    # nothing to flag, so hand back the (empty) formatted frame as-is.
    if df.empty:
        return df

    # Detect anomalies.
    clf = IsolationForest(contamination=contamination, random_state=random_state)
    labels = clf.fit_predict(features)

    # Filter with a mask instead of a temporary 'anomali' column, so an input
    # column that happens to carry that name is neither overwritten nor dropped.
    return df[labels == 1]