From 3c9c6c97b915a335145ab1bb9eaa38d059e3c994 Mon Sep 17 00:00:00 2001 From: Jeff Moe Date: Thu, 19 Sep 2024 19:46:30 -0600 Subject: [PATCH] Sort by unique counts --- hsparse/parse_csv_contacts.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/hsparse/parse_csv_contacts.py b/hsparse/parse_csv_contacts.py index 7f93d37..77b9190 100644 --- a/hsparse/parse_csv_contacts.py +++ b/hsparse/parse_csv_contacts.py @@ -73,7 +73,11 @@ def csv_non_empty(CSV): } unique_counts = {col: df[col].nunique() for col in non_empty_columns.keys()} - sorted_columns = sorted(unique_counts.items(), key=lambda x: x[1], reverse=True) + sorted_columns = sorted( + unique_counts.items(), + key=lambda x: (unique_counts[x[0]], non_empty_columns[x[0]]), + reverse=True, + ) print("Column\tNon-empty values\tUnique values")