Count unique values per column

This commit is contained in:
Jeff Moe 2024-09-19 19:26:23 -06:00
parent 5b02a6198f
commit e08dfc02f7

View file

@@ -78,11 +78,15 @@ def csv_non_empty(CSV):
col: df[col].count() for col in df.columns if not df[col].isnull().all()
}
sorted_columns = sorted(non_empty_columns.items(), key=lambda x: x[1], reverse=True)
unique_counts = {col: df[col].nunique() for col in non_empty_columns.keys()}
sorted_columns = sorted(unique_counts.items(), key=lambda x: x[1], reverse=True)
print("Column\tNon-empty values\tUnique values")
if sorted_columns:
for col, count in sorted_columns:
print(f"{col}: {count}")
for col, unique_count in sorted_columns:
count = non_empty_columns[col]
print(f"{col}\t{count}\t{unique_count}")
else:
print("No non-empty values found.")