{"columns":[{"alerts":[],"column":"country_code","extras":{"singletons":0,"top_values":[["AFG",22],["AGO",22],["ALB",22],["ARE",22],["ARG",22],["ARM",22],["ATG",22],["AUS",22],["AUT",22],["AZE",22],["BDI",22],["BEL",22],["BEN",22],["BFA",22],["BGD",22],["BGR",22],["BHR",22],["BHS",22],["BIH",22],["BLR",22]]},"kind":"categorical","n":4070,"n_null":0,"n_unique":185,"null_rate":0.0,"stats":{"cardinality":185,"entropy":7.531381460516311,"entropy_ratio":0.9999999999999999,"top_rate":0.005405405405405406,"top_value":"AFG"}},{"alerts":[],"column":"region","extras":{"singletons":0,"top_values":[["Europe",1100],["Africa",1034],["Americas",748],["Eastern Mediterranean",484],["Western Pacific",484],["South-East Asia",220]]},"kind":"categorical","n":4070,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"cardinality":6,"entropy":2.41967068057571,"entropy_ratio":0.9360563953638272,"top_rate":0.2702702702702703,"top_value":"Europe"}},{"alerts":[],"column":"year","extras":{"histogram":{"counts":[185,185,0,185,0,185,0,185,0,185,0,185,0,185,0,185,0,185,0,185,185,0,185,0,185,0,185,0,185,0,185,0,185,0,185,0,185,0,185,185],"edges":[2000.0,2000.525,2001.05,2001.575,2002.1,2002.625,2003.15,2003.675,2004.2,2004.725,2005.25,2005.775,2006.3,2006.825,2007.35,2007.875,2008.4,2008.925,2009.45,2009.975,2010.5,2011.025,2011.55,2012.075,2012.6,2013.125,2013.65,2014.175,2014.7,2015.225,2015.75,2016.275,2016.8,2017.325,2017.85,2018.375,2018.9,2019.425,2019.95,2020.475,2021.0]},"sample":[2020.0,2004.0,2005.0,2016.0,2011.0,2005.0,2006.0,2008.0,2017.0,2018.0,2021.0,2012.0,2004.0,2016.0,2018.0,2005.0,2013.0,2004.0,2000.0,2001.0,2018.0,2010.0,2003.0,2008.0,2003.0,2013.0,2006.0,2014.0,2021.0,2010.0,2014.0,2016.0,2000.0,2001.0,2005.0,2006.0,2007.0,2003.0,2005.0,2009.0,2013.0,2020.0,2021.0,2001.0,2001.0,2003.0,2004.0,2008.0,2002.0,2004.0,2016.0,2019.0,2021.0,2008.0,2011.0,2021.0,2001.0,2011.0,2006.0,2009.0,2018.0,2019.0,2002.0,2006.0,2015.0,2000.0,2002.0,2009.0,2015.0,2021.0,2000.0,2010.0,2014.0,2001.0,2002.0,2010.0,2013.0,2005.0,2008.0,2007.0,2015.0,2017.0,2010.0,2011.0,2003.0,2008.0,2011.0,2000.0,2004.0,2006.0,2015.0,2017.0,2006.0,2008.0,2019.0,2009.0,2000.0,2004.0,2006.0,2004.0,2013.0,2011.0,2020.0,2016.0,2017.0,2003.0,2012.0,2019.0,2019.0,2001.0,2006.0,2019.0,2005.0,2008.0,2012.0,2013.0,2003.0,2008.0,2014.0,2018.0,2019.0,2002.0,2013.0,2001.0,2006.0,2014.0,2015.0,2000.0,2012.0,2013.0,2004.0,2010.0,2011.0,2016.0,2020.0,2005.0,2007.0,2017.0,2000.0,2005.0,2006.0,2009.0,2012.0,2016.0,2018.0,2012.0,2016.0,2019.0,2021.0,2014.0,2021.0,2007.0,2012.0,2015.0,2017.0,2006.0,2007.0,2019.0,2001.0,2005.0,2012.0,2014.0,2020.0,2002.0,2011.0,2012.0,2005.0,2014.0,2019.0,2017.0,2021.0,2011.0,2001.0,2017.0,2003.0,2021.0,2019.0,2004.0,2021.0,2004.0,2009.0,2008.0,2021.0,2006.0,2003.0,2009.0,2010.0,2012.0,2001.0,2006.0,2010.0,2011.0,2014.0,2016.0,2017.0,2016.0,2003.0,2005.0,2014.0,2018.0,2019.0,2021.0,2003.0,2006.0,2013.0,2015.0,2021.0,2008.0,2010.0,2012.0,2014.0,2017.0,2018.0,2021.0,2002.0,2008.0,2000.0,2014.0,2000.0,2001.0,2014.0,2000.0,2006.0,2013.0,2015.0,2018.0,2019.0,2004.0,2007.0,2008.0,2013.0,2015.0,2018.0,2020.0,2021.0,2003.0,2004.0,2002.0,2004.0,2010.0,2018.0,2006.0,2010.0,2013.0,2018.0,2017.0,2018.0,2000.0,2003.0,2013.0,2003.0,2008.0,2009.0,2021.0,2000.0,2002.0,2003.0,2006.0,2013.0,2016.0,2013.0,2021.0,2014.0,2019.0,2007.0,2021.0,2005.0,2004.0,2006.0,2012.0,2013.0,2006.0,2003.0,2007.0,2014.0,2018.0,2013.0,2005.0,2010.0,2004.0,2006.0,2016.0,2019.0,2017.0,2021.0,2014.0,2016.0,2000.0,2004.0,2008.0,2018.0,2013.0,2002.0,2003.0,2009.0,2011.0,2018.0,2002.0,2003.0,2014.0,2015.0,2018.0,2009.0,2016.0,2017.0,2017.0,2018.0,2000.0,2001.0,2008.0,2010.0,2013.0,2019.0,2020.0,2010.0,2011.0,2019.0,2021.0,2012.0,2013.0,2017.0,2018.0,2000.0,2000.0,2008.0,2002.0,2013.0,2017.0,2020.0,2005.0,2021.0,2010.0,2001.0,2014.0,2021.0,2017.0,2015.0,2001.0,2002.0,2010.0,2012.0,2000.0,2016.0,2001.0,2009.0,2014.0,2003.0,2004.0,2005.0,2009.0,2010.0,2015.0,2003.0,2011.0,2019.0,2002.0,2016.0,2017.0,2019.0,2021.0,2000.0,2008.0,2009.0,2012.0,2013.0,2014.0,2016.0,2020.0,2013.0,2019.0,2021.0,2006.0,2003.0,2005.0,2006.0,2010.0,2019.0,2020.0,2001.0,2002.0,2012.0,2003.0,2007.0,2015.0,2003.0,2016.0,2011.0,2013.0,2003.0,2007.0,2015.0,2009.0,2010.0,2002.0,2018.0,2019.0,2005.0,2017.0,2000.0,2008.0,2011.0,2013.0,2015.0,2006.0,2002.0,2008.0,2005.0,2016.0,2010.0,2021.0,2006.0,2010.0,2017.0,2001.0,2000.0,2014.0,2017.0,2018.0,2020.0,2004.0,2012.0,2016.0,2017.0,2020.0,2004.0,2011.0,2003.0,2004.0,2002.0,2005.0,2008.0,2018.0,2016.0,2020.0,2021.0,2006.0,2009.0,2015.0,2004.0,2010.0,2013.0,2016.0,2005.0,2006.0,2020.0,2021.0,2001.0,2007.0,2013.0,2015.0,2003.0,2006.0,2016.0,2001.0,2007.0,2005.0,2010.0,2011.0,2012.0,2014.0,2020.0,2021.0,2013.0,2009.0,2011.0,2018.0,2021.0,2001.0,2004.0,2008.0,2011.0,2012.0,2013.0,2014.0,2009.0,2011.0,2002.0,2005.0,2007.0,2009.0,2010.0,2015.0,2016.0,2000.0,2001.0,2004.0,2003.0,2013.0,2005.0,2018.0,2019.0,2003.0,2019.0,2000.0,2007.0,2010.0,2020.0,2000.0,2018.0,2020.0]},"kind":"numeric","n":4070,"n_null":0,"n_unique":22,"null_rate":0.0,"stats":{"iqr":11.0,"kurtosis":-1.204968944099379,"max":2021.0,"mean":2010.5,"median":2010.5,"min":2000.0,"n_outliers":0,"outlier_rate":0.0,"q1":2005.0,"q3":2016.0,"skew":0.0,"std":6.345068310532454,"zero_rate":0.0}},{"alerts":[],"column":"hale_years","extras":{"histogram":{"counts":[1,2,4,12,13,10,14,18,24,36,38,50,51,46,58,62,85,100,98,114,96,102,115,117,130,124,136,196,217,316,301,256,255,215,177,214,163,70,19,15],"edges":[35.3,36.262499999999996,37.224999999999994,38.1875,39.15,40.1125,41.074999999999996,42.037499999999994,43.0,43.9625,44.925,45.887499999999996,46.849999999999994,47.8125,48.775,49.7375,50.699999999999996,51.662499999999994,52.625,53.5875,54.55,55.5125,56.474999999999994,57.4375,58.4,59.3625,60.325,61.287499999999994,62.25,63.2125,64.175,65.1375,66.1,67.0625,68.025,68.9875,69.94999999999999,70.9125,71.875,72.8375,73.8]},"sample":[51.7,45.4,46.3,53.7,67.0,68.3,68.8,69.3,69.3,69.5,67.3,66.2,63.5,65.5,66.4,65.7,65.9,68.8,67.6,68.0,66.1,51.9,67.5,68.4,50.8,54.1,48.8,53.1,54.6,60.8,62.9,63.4,62.8,62.9,63.5,63.6,63.9,61.8,62.4,64.0,65.1,64.7,61.5,65.9,59.9,60.0,60.3,61.6,62.5,63.0,64.8,65.2,63.8,61.0,61.8,57.4,61.1,63.3,65.6,66.2,66.5,66.3,66.6,67.2,67.1,57.2,58.8,61.8,63.4,64.8,41.3,50.1,53.2,38.5,38.8,42.7,42.9,69.0,69.4,70.0,70.8,71.2,67.9,68.4,63.9,65.9,66.8,44.5,46.0,47.8,53.2,54.3,47.5,48.6,53.5,52.3,63.3,64.5,65.1,56.1,58.6,69.2,68.8,68.2,67.8,68.7,70.6,71.1,68.5,67.7,68.5,57.6,67.8,68.2,69.3,69.4,63.8,63.8,63.7,63.8,64.1,63.4,65.6,63.9,64.7,61.7,61.4,47.7,53.5,53.8,69.5,70.7,70.8,71.4,70.6,63.5,63.8,67.9,44.5,49.9,50.9,54.2,56.7,58.9,59.6,69.1,69.8,70.2,69.9,59.7,57.7,69.3,70.0,70.2,70.5,56.9,56.9,58.2,50.1,51.8,54.3,55.3,68.8,61.9,63.5,63.6,52.7,56.2,57.9,52.8,55.8,49.1,47.3,53.0,68.2,68.6,63.4,59.8,59.3,56.2,57.1,61.7,60.0,66.3,50.3,52.9,35.3,53.2,63.0,64.0,65.0,65.3,66.0,66.3,63.0,59.9,67.4,68.0,69.7,70.3,70.5,70.0,63.1,64.5,66.0,66.1,64.0,59.9,61.0,61.4,60.2,61.2,62.5,61.0,69.6,70.4,68.3,71.2,63.6,63.2,67.1,71.1,71.9,72.7,73.1,73.5,73.6,57.1,57.7,58.9,61.9,63.0,63.9,62.5,61.6,53.5,53.6,67.4,68.1,70.1,72.1,67.8,69.0,69.9,70.8,60.1,60.3,65.0,65.8,66.7,45.4,50.7,51.1,54.0,64.2,63.8,63.8,64.6,64.1,62.7,65.7,61.8,66.2,67.1,38.6,64.2,68.8,61.9,61.7,64.6,64.8,61.6,58.6,59.5,62.6,64.1,55.5,64.4,66.1,64.8,65.0,65.4,65.5,66.5,63.7,52.1,52.9,68.0,68.8,69.5,71.3,58.7,64.6,64.6,66.0,66.5,67.5,56.4,56.8,60.5,60.8,61.8,46.2,49.1,49.7,61.3,61.4,62.2,39.7,47.7,49.9,53.1,55.5,55.7,65.1,65.2,65.5,63.9,53.8,54.1,54.6,53.0,46.6,65.3,65.7,68.3,70.3,70.5,70.2,69.1,71.2,59.7,67.2,69.3,70.0,64.7,56.7,66.2,66.4,66.8,67.1,65.4,69.8,61.0,61.1,61.5,55.8,55.9,56.0,56.7,56.9,57.9,64.9,66.6,67.6,66.8,69.2,67.8,69.4,68.8,55.9,62.4,62.4,63.0,69.3,69.6,69.7,69.4,64.8,64.9,60.9,59.9,61.9,62.3,62.7,64.2,67.9,66.6,62.4,62.2,65.2,56.5,58.8,62.1,45.6,58.5,58.0,58.6,52.8,55.5,58.7,71.9,72.1,56.4,58.0,58.1,45.1,51.6,62.0,44.3,39.2,46.3,47.2,64.4,46.1,49.7,58.2,62.3,63.0,60.3,67.4,68.6,69.8,69.3,41.4,44.6,47.0,64.3,67.1,63.5,56.6,52.3,51.4,62.0,45.7,48.9,49.3,49.6,62.8,57.8,59.3,61.1,59.7,60.3,59.5,63.4,61.9,63.8,62.1,63.5,64.3,63.9,65.2,65.3,66.2,63.6,64.2,66.3,66.5,66.4,48.0,50.5,57.3,43.3,49.3,58.7,61.2,61.8,62.0,61.8,63.0,61.6,66.6,66.4,66.6,66.0,63.9,55.1,56.2,58.0,59.5,59.9,60.5,60.9,63.9,63.6,64.5,64.9,64.8,64.8,64.9,64.8,65.0,57.5,57.5,57.9,61.7,61.7,56.4,56.9,57.4,45.9,56.3,38.9,46.6,49.9,53.9,40.5,51.6,52.2]},"kind":"numeric","n":4070,"n_null":0,"n_unique":345,"null_rate":0.0,"stats":{"iqr":10.100000000000009,"kurtosis":0.027406884427315426,"max":73.8,"mean":61.03022113022113,"median":63.1,"min":35.3,"n_outliers":45,"outlier_rate":0.011056511056511056,"q1":56.3,"q3":66.4,"skew":-0.8235320872525065,"std":7.344160452380039,"zero_rate":0.0}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","columns","kinds"],"featured_charts":[{"caption":"Look for the left-skewed shape and the lower tail of countries with HALE under ~50 years.","column":"hale_years","kind":"histogram"},{"caption":"Note the uneven regional representation, with Europe and Africa contributing the most rows and South-East Asia the fewest.","column":"region","kind":"bar"},{"caption":"Confirm the uniform yearly coverage from 2000 to 2021 that makes this a balanced panel.","column":"year","kind":"histogram"},{"caption":"185 countries each appear ~22 times; useful as a sanity check on panel completeness.","column":"country_code","kind":"length"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset contains 4,070 rows of WHO Healthy Life Expectancy (HALE) data spanning 185 countries, 6 regions, and 22 years from 2000 to 2021. The panel is balanced \u2014 each country contributes 22 yearly observations \u2014 so the country_code distribution is essentially uniform and not informative on its own. The most interesting variable is hale_years, which ranges from 35.3 to 73.8 with a mean of 61.0 and a left-skewed distribution (skew = -0.82), indicating a long tail of countries with notably lower healthy life expectancy. Regional coverage is uneven, with Europe (1,100 rows) and Africa (1,034) dominating while South-East Asia contributes only 220 rows. Start by examining the hale_years distribution and how it breaks down by region.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds ISO 3166-1 alpha-3 country codes, with 185 unique values across 4,070 rows and zero nulls. The distribution is perfectly uniform \u2014 every visible top value appears exactly 22 times and entropy_ratio is 1.0 \u2014 which strongly suggests a panel structure (185 countries \u00d7 22 periods).","role":"foreign_key","scope":"column","target":"country_code","treatment":"Use as a join key to country reference data; pair with a time column to model the panel."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a categorical region field with 6 distinct values matching WHO regional groupings (Europe, Africa, Americas, Eastern Mediterranean, Western Pacific, South-East Asia) and no nulls across 4070 rows. Distribution is fairly balanced \u2014 entropy ratio of 0.936 \u2014 with Europe leading at 27% (1100 rows) and South-East Asia trailing at 220. The mix of WHO-style labels suggests this dataset is sourced from or aligned with WHO global health data.","role":"feature","scope":"column","target":"region","treatment":"one-hot or target-encode for modelling; safe to use as a stratification key."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.kurtosis","stats.std","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"This column captures the calendar year, spanning 2000 to 2021 with 22 distinct integer values across 4070 rows and no nulls. The distribution is perfectly symmetric (skew 0.0, mean equals median at 2010.5) with negative kurtosis (-1.20), indicating a near-uniform spread across years rather than a concentration in any period. No outliers are flagged.","role":"timestamp","scope":"column","target":"year","treatment":"Treat as a discrete time index for grouping or trend analysis rather than a continuous numeric feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Healthy life expectancy in years (HALE), spanning 35.3 to 73.8 with a mean of 61.03 and median 63.1 across 4070 rows. The distribution is left-skewed (skew -0.82), reflecting a long tail of low-HALE observations pulling below the bulk concentrated between Q1=56.3 and Q3=66.4. Only 1.1% outliers and zero nulls, so the column is clean and ready to use.","role":"feature","scope":"column","target":"hale_years","treatment":"Use directly as a numeric feature; consider modelling the left skew if linearity is required."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":1627,"prompt_tokens":4490,"total_tokens":6117}},"language_counts":{},"meta":{"generated_at":"2026-05-01T17:01:32+00:00","mode":"full","row_count":4070,"sampled_rows":4070,"seed":42,"source":"/home/coolhand/datasets/accessibility-atlas/who_hale_long.csv"},"notes":[],"saturn_version":"0.2.0","schema":{"country_code":"categorical","hale_years":"numeric","region":"categorical","year":"numeric"}}
