ML
1. Write a Python program to perform data preprocessing on a given data set. import pandas as pd # Load the dataset from the Excel file into a DataFrame file_path = 'C:\\Users\\datset_noise.xlsx' df = pd.read_excel(file_path, engine='openpyxl') print("Original DataFrame:") print(df.to_string(index=False)) # Step 2: Remove rows with missing values df_no_missing = df.dropna() print("\nDataFrame after removing rows with missing values:") print(df_no_missing.to_string(index=False)) print(f"\nTotal count after removing rows with missing values: {len(df_no_missing)}") # Store rows with missing values df_missing_rows = df[df.isna().any(axis=1)] # Step 3: Remove duplicate rows df_no_duplicates = df_no_missing.drop_duplicates(subset=["Name","DOB","Age","Date of Joining"]) print("\nDataFrame after removing duplicate rows:") print(df_no_duplicates.to_string(index=False)) print(f"\nTotal count aft...