Skip to content
Snippets Groups Projects
Commit a49dedba authored by agshaathalla
Browse files

data drift

parent 63346f6c
Branches
No related merge requests found
import pandas as pd
def sample_data(input_csv, output_csv, sample_fraction, random_state=None):
    """Draw a random row sample from a CSV file and save it as a new CSV.

    A summary and the first rows of the data are printed to stdout both
    before and after sampling.

    Args:
        input_csv: Path of the CSV file to read.
        output_csv: Path the sampled rows are written to (without the
            DataFrame index column).
        sample_fraction: Fraction of rows to keep, forwarded to
            ``DataFrame.sample(frac=...)``.
        random_state: Optional seed forwarded to ``DataFrame.sample`` so the
            selection is reproducible.

    Returns:
        The sampled ``pandas.DataFrame`` that was written to ``output_csv``.
    """
    data = pd.read_csv(input_csv)

    print("Data sebelum sampling:")
    # DataFrame.info() writes its report to stdout itself and returns None;
    # wrapping it in print() would emit a stray "None" line.
    data.info()
    print(data.head())

    sampled_data = data.sample(frac=sample_fraction, random_state=random_state)

    print("\nData setelah sampling:")
    sampled_data.info()
    print(sampled_data.head())

    sampled_data.to_csv(output_csv, index=False)
    print(f"\nHasil sampling disimpan ke {output_csv}")

    return sampled_data
if __name__ == "__main__":
    # Script entry point: write a reproducible 20% sample of the churn
    # dataset to a separate CSV file.
    sample_data(
        input_csv="telco_customer_churn.csv",
        output_csv="telco_customer_churn_drift.csv",
        sample_fraction=0.2,
        random_state=42,
    )
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment