"""De-duplicate PHC ISS tool results so each facility appears once.

Reads the raw results CSV, builds a single ``Facilities_Combined`` key from
the two facility-name columns, sorts by ``ab2`` (descending) and keeps one
record per facility, then writes the result to a new CSV.
"""

try:
    from google.colab import data_table
except ImportError:
    # Not running inside Colab; nothing in this script needs data_table.
    data_table = None

import pandas as pd

INPUT_CSV = 'PHC_ISS_TOOL_Q2_OCT_11_V2_2022_results_Mon_7_42.csv'
OUTPUT_CSV = 'PHC_ISS_TOOL_Q2_OCT_11_V2_2022_results.csv'

FACILITY_COL_A = "grp1:facilityDetails:fac.tl"
FACILITY_COL_B = "grp2:ggp1:ntl_3"
COMBINED_COL = "Facilities_Combined"
ORDER_COL = 'ab2'


def combine_facility_names(frame, first_col=FACILITY_COL_A,
                           second_col=FACILITY_COL_B, out_col=COMBINED_COL):
    """Add ``out_col`` = text of ``first_col`` + text of ``second_col``.

    Missing cells contribute an empty string.  The frame is modified in
    place (a column is added) and also returned for convenience.

    Args:
        frame: DataFrame containing ``first_col`` and ``second_col``.
        first_col: Name of the first facility-name column.
        second_col: Name of the second facility-name column.
        out_col: Name of the column to create/overwrite.

    Returns:
        The same DataFrame, with ``out_col`` populated.
    """
    def _as_text(column):
        # Blank out only cells that were genuinely missing.  Replacing the
        # literal text "nan" after astype(str) would also mangle real names
        # that merely contain those letters (e.g. "Kinango" -> "Kigo").
        return column.astype(str).where(column.notna(), "")

    frame[out_col] = _as_text(frame[first_col]) + _as_text(frame[second_col])
    return frame


def first_per_facility(sorted_frame, key_col=COMBINED_COL):
    """Collapse ``sorted_frame`` to one row per ``key_col`` value.

    The caller is expected to have sorted the frame so that the preferred
    record for each facility comes first.  Note that ``GroupBy.first()``
    takes the first *non-null* value of each column within a group, so a
    gap in the leading row is filled from a later row of the same facility.

    Args:
        sorted_frame: DataFrame already ordered by preference.
        key_col: Column identifying a facility.

    Returns:
        A new DataFrame with ``key_col`` as an ordinary column and one row
        per distinct key.
    """
    return sorted_frame.groupby([key_col]).first().reset_index()


# A notebook cell and a directly-run script both have __name__ == "__main__",
# so this still executes there; the guard only prevents the file I/O from
# firing when the helpers above are imported from elsewhere.
if __name__ == "__main__":
    df = pd.read_csv(INPUT_CSV)
    print(df.shape)

    df = combine_facility_names(df)

    # Highest ab2 first, so that record wins within each facility group.
    df = df.sort_values(ORDER_COL, ascending=False)

    NewDF = first_per_facility(df)
    # The default index is written as the first (unnamed) CSV column,
    # matching the file layout this script has always produced.
    NewDF.to_csv(OUTPUT_CSV)