{"columns":[{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"allcaps","level":"info","message":"100.0% rows are all-caps"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"}],"column":"fips","extras":{"language_counts":{},"language_sample_size":3222,"length_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3222,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[4.5,4.525,4.55,4.575,4.6,4.625,4.65,4.675,4.7,4.725,4.75,4.775,4.8,4.825,4.85,4.875,4.9,4.925,4.95,4.975,5.0,5.025,5.05,5.075,5.1,5.125,5.15,5.175,5.2,5.225,5.25,5.275,5.3,5.325,5.35,5.375,5.4,5.425,5.45,5.475,5.5]},"near_unique":true,"sample":["01007","47021","49031","48279","27091","56033","28017","51165","48291","05019","37125","31109","20017","01049","20107","16087","08109","48371","72109","26129","20201","05055","13279","12001","42021","47089","34019","17043","08009","56023","39145","40011","01063","26069","22115","28011","54057","30093","28085","31107","48221","53063","20039","53055","55063","72007","22013","26087","13293","51057"],"top_values":[],"top_words":[["01001",1],["01003",1],["01005",1],["01007",1],["01009",1],["01011",1],["01013",1],["01015",1],["01017",1],["01019",1],["01021",1],["01023",1],["01025",1],["01027",1],["01029",1],["01031",1],["01033",1],["01035",1],["01037",1],["01039",1],["01041",1],["01043",1],["01045",1],["01047",1],["01049",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3222,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":3222,"n_null":0,"n_unique":3222,"null_rate":0.0,"stats":{"allcaps_rate":1.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":5,"len_mean":5.0,"len_median":5.0,"len_min":5,"len_p95":5.0,"n_duplicates":0,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":121.22000000000004,"url_rate":0.0,"vocab_size":3222,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"}],"column":"county_name","extras":{"language_counts":{},"language_sample_size":3222,"length_histogram":{"counts":[26,72,121,190,264,407,420,363,320,240,231,152,139,165,41,28,16,10,5,0,1,1,0,1,1,0,2,0,1,1,0,0,0,0,2,1,0,0,0,1],"edges":[16.0,17.075,18.15,19.225,20.3,21.375,22.45,23.525,24.6,25.674999999999997,26.75,27.825,28.9,29.975,31.049999999999997,32.125,33.2,34.275,35.349999999999994,36.425,37.5,38.575,39.65,40.724999999999994,41.8,42.875,43.95,45.025,46.099999999999994,47.175,48.25,49.324999999999996,50.4,51.475,52.55,53.625,54.699999999999996,55.775,56.85,57.925,59.0]},"near_unique":true,"sample":["Bibb County, Alabama","Cheatham County, Tennessee","Piute County, Utah","Lamb County, Texas","Martin County, Minnesota","Sheridan County, Wyoming","Chickasaw County, Mississippi","Rockingham County, Virginia","Liberty County, Texas","Clark County, Arkansas","Moore County, North Carolina","Lancaster County, Nebraska","Chase County, Kansas","DeKalb County, Alabama","Linn County, Kansas","Washington County, Idaho","Saguache County, Colorado","Pecos County, Texas","Patillas Municipio, Puerto Rico","Ogemaw County, Michigan","Washington County, Kansas","Greene County, Arkansas","Toombs County, Georgia","Alachua County, Florida","Cambria County, Pennsylvania","Jefferson County, Tennessee","Hunterdon County, New Jersey","DuPage County, Illinois","Baca County, Colorado","Lincoln County, Wyoming","Scioto County, Ohio","Blaine County, Oklahoma","Greene County, Alabama","Iosco County, Michigan","Vernon Parish, Louisiana","Bolivar County, Mississippi","Mineral County, West Virginia","Silver Bow County, Montana","Lincoln County, Mississippi","Knox County, Nebraska","Hood County, Texas","Spokane County, Washington","Decatur County, Kansas","San Juan County, Washington","La Crosse County, Wisconsin","Aguas Buenas Municipio, Puerto Rico","Bienville Parish, Louisiana","Lapeer County, Michigan","Upson County, Georgia","Essex County, Virginia"],"top_values":[],"top_words":[["county,",2999],["texas",256],["virginia",189],["georgia",159],["north",155],["carolina",147],["new",131],["dakota",121],["kentucky",120],["missouri",115],["south",113],["kansas",105],["illinois",102],["iowa",101],["tennessee",95],["indiana",93],["nebraska",93],["ohio",91],["minnesota",87],["mississippi",84],["michigan",83],["oklahoma",78],["municipio,",78],["puerto",78],["rico",78]],"vocab_skipped":null,"word_histogram":{"counts":[2492,0,0,0,0,0,0,667,0,0,0,0,0,0,0,57,0,0,0,0,0,0,5,0,0,0,0,0,0,1],"edges":[3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.9333333333333336,4.066666666666666,4.2,4.333333333333333,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0,5.133333333333333,5.266666666666667,5.4,5.533333333333333,5.666666666666666,5.8,5.933333333333334,6.066666666666666,6.2,6.333333333333334,6.466666666666667,6.6,6.733333333333333,6.866666666666667,7.0]}},"kind":"text","n":3222,"n_null":0,"n_unique":3222,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":59,"len_mean":24.324022346368714,"len_median":24.0,"len_min":16,"len_p95":31.0,"n_duplicates":0,"n_empty":0,"one_word_rate":0.0,"readability_flesch_mean":10.283900000000026,"url_rate":0.0,"vocab_size":1990,"word_mean":3.2482929857231535,"word_median":3.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+2.10"}],"column":"poverty_rate","extras":{"histogram":{"counts":[7,34,106,246,320,354,393,364,306,262,192,149,123,91,52,44,34,23,18,14,6,8,3,8,5,9,4,11,7,8,2,6,5,5,1,0,0,0,1,1],"edges":[1.6,3.218,4.836,6.453999999999999,8.072,9.69,11.307999999999998,12.925999999999998,14.543999999999999,16.162,17.78,19.398,21.016,22.634,24.252,25.87,27.488,29.105999999999998,30.724,32.342,33.96,35.577999999999996,37.196,38.814,40.431999999999995,42.05,43.668,45.286,46.903999999999996,48.522,50.14,51.757999999999996,53.376,54.994,56.611999999999995,58.23,59.848,61.465999999999994,63.083999999999996,64.702,66.32]},"sample":[15.88,14.86,16.62,25.01,22.03,10.92,26.76,9.58,11.55,6.9,18.48,16.88,16.01,13.53,19.99,14.12,13.55,17.56,20.95,26.57,9.15,14.29,18.52,12.32,12.88,12.58,9.0,17.42,8.15,27.07,11.78,6.62,22.53,24.19,15.03,9.21,20.6,11.45,11.69,6.8,9.68,14.04,18.18,12.42,10.49,14.34,26.42,13.68,11.43,15.66,22.45,10.52,22.85,9.26,14.41,27.51,13.18,26.49,13.98,19.93,25.73,7.19,23.55,9.64,21.25,4.6,15.53,19.8,13.56,8.14,13.35,21.86,15.36,16.14,20.32,26.22,15.26,16.03,20.72,28.96,31.34,19.18,22.44,18.15,21.82,14.89,14.58,10.39,6.93,22.14,14.74,18.13,13.38,9.75,14.17,13.38,5.98,22.96,13.45,12.53,13.34,6.65,16.08,11.51,16.37,9.37,13.21,14.14,10.83,12.76,8.91,7.21,12.07,6.06,9.47,6.56,11.83,7.8,13.34,13.02,16.98,5.94,12.21,7.69,14.49,11.33,19.63,8.54,11.89,7.49,13.17,12.79,15.24,20.9,13.61,15.29,11.87,9.93,4.11,7.89,8.79,7.92,10.63,16.9,14.96,10.92,10.12,22.73,7.61,13.66,10.49,7.32,9.93,16.84,23.13,26.29,10.58,26.1,20.28,16.82,21.06,34.04,16.12,22.48,23.83,9.28,13.7,17.17,40.28,16.55,29.7,24.03,26.83,18.05,19.64,14.95,5.83,6.16,7.14,10.97,11.96,15.77,10.25,8.34,16.47,13.25,16.25,23.61,11.08,12.92,7.7,17.07,10.67,11.01,14.15,20.19,16.14,3.78,12.23,11.22,8.58,4.94,8.51,8.71,9.09,10.11,12.36,10.34,8.94,9.63,10.39,8.79,14.02,27.05,23.56,18.38,31.78,19.64,24.85,32.2,22.33,22.82,16.74,23.2,15.76,16.32,28.68,12.32,29.13,14.92,14.52,19.62,9.44,12.06,22.47,15.81,12.34,20.58,17.62,12.99,15.57,16.41,16.57,20.19,10.25,12.19,7.49,14.76,9.27,11.85,5.23,20.37,16.33,12.33,5.43,12.97,10.79,11.1,10.03,6.27,8.68,11.32,10.83,7.97,10.4,9.24,8.0,9.0,11.61,7.47,13.03,7.74,17.77,17.81,17.05,17.54,15.11,12.97,13.01,17.13,11.47,11.59,15.75,6.49,14.12,24.42,9.08,16.95,8.41,5.87,21.09,13.93,22.04,12.43,11.38,29.91,15.99,9.27,11.7,13.32,11.01,15.28,10.72,6.62,10.21,10.28,13.39,6.86,10.85,15.78,13.71,11.74,8.71,10.6,15.43,8.95,13.5,16.08,8.46,10.58,9.42,15.34,5.17,19.07,14.15,12.84,16.04,14.7,11.01,20.84,18.78,14.62,12.52,13.72,7.58,14.87,12.13,12.68,12.99,12.5,11.69,9.86,10.37,13.2,5.63,17.04,13.75,15.31,16.2,9.0,12.35,10.91,11.95,10.84,12.22,11.59,7.77,10.36,20.32,16.97,18.72,17.82,10.92,19.98,27.78,16.68,16.83,14.42,29.6,12.48,10.55,14.52,7.32,23.83,7.44,8.49,7.98,26.01,8.6,12.64,13.92,17.56,13.38,19.71,20.99,14.85,15.63,12.29,5.9,11.94,11.94,7.53,8.79,16.51,6.32,7.45,14.11,12.66,12.66,9.98,8.87,14.5,2.59,7.96,12.54,10.24,11.31,23.44,13.48,9.51,16.37,14.74,4.17,17.31,11.02,6.38,22.35,16.2,13.62,18.39,12.63,37.19,15.68,8.56,11.74,11.81,10.37,12.56,15.24,5.4,7.33,13.25,12.93,9.76,8.02,25.98,10.86,13.04,6.84,16.74,12.99,19.32,5.38,19.91,17.21,8.82,17.32,10.0,13.46,17.53,22.21,17.36,19.47,9.43,16.09,6.84,8.45,11.64,18.85,10.99,8.63,10.94,11.04,19.18,18.77,16.35,21.08,17.83,20.29,16.64,8.23,10.98,9.8,12.78,12.71,14.69,11.78,11.58,9.56,6.91,13.56,13.24,4.95,16.08,18.34,8.68,8.07,42.15,45.61,23.52,47.36,37.12,55.97,52.81,39.12,45.35,52.02,48.49,54.07,43.67]},"kind":"numeric","n":3222,"n_null":0,"n_unique":1719,"null_rate":0.0,"stats":{"iqr":7.75,"kurtosis":6.890992451669181,"max":66.32,"mean":15.100406579764124,"median":13.55,"min":1.6,"n_outliers":137,"outlier_rate":0.04252017380509,"q1":10.16,"q3":17.91,"skew":2.0959367375026883,"std":7.705602319057618,"zero_rate":0.0}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","columns.poverty_rate.stats","columns.county_name.top_words","columns.fips.n_unique"],"featured_charts":[{"caption":"Look for the right-skewed tail above ~28% where the 137 high-poverty outlier counties sit.","column":"poverty_rate","kind":"histogram"},{"caption":"Top words show which states dominate the county list, led by Texas, Virginia, and Georgia.","column":"county_name","kind":"bar"},{"caption":"Name length is tight (median 24 chars) \u2014 useful as a sanity check that entries follow a consistent 'X County, State' format.","column":"county_name","kind":"length"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset contains 3,222 rows describing U.S. county-level poverty, with three columns: a FIPS code, a county name, and a poverty rate. Each row is a unique county (3,222 unique FIPS codes and county names), so the analytical signal lives in the poverty_rate column. Poverty rates range from 1.6% to 66.32% with a mean of 15.1% and median of 13.55%, and the distribution is right-skewed (skew \u2248 2.10) with 137 outliers on the high end. The county_name field also reveals geographic concentration, with Texas (256), Virginia (189), and Georgia (159) contributing the most counties. Start by examining the shape of poverty_rate and which states the high-poverty outliers cluster in.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.len_min","stats.len_max","stats.len_mean","stats.one_word_rate","stats.allcaps_rate","stats.duplicate_rate","stats.vocab_size","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds 5-character FIPS codes uniquely identifying each of the 3222 rows (n_unique equals n, null_rate 0). Every value is exactly 5 characters, one word, all-caps/numeric, with zero duplicates or empties. Sample values like 01001, 01003, 01005 match the standard US county FIPS encoding (state+county).","role":"identifier","scope":"column","target":"fips","treatment":"Treat as a county-level key; left-join on this id and exclude from modelling features."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.len_min","stats.len_median","stats.len_max","stats.duplicate_rate","top_words","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This is a county identifier string, likely formatted as \"<County Name> County, <State>\" \u2014 \"county,\" appears in 2999 of 3222 rows and Texas (256), Virginia (189), and Georgia (159) lead the state mentions. Every one of the 3222 values is unique with zero nulls or duplicates, and lengths cluster tightly (min 16, median 24, max 59), consistent with a clean US county roster. The 223 rows lacking the \"county,\" token are worth checking \u2014 likely parishes, boroughs, or independent cities.","role":"identifier","scope":"column","target":"county_name","treatment":"Split into county and state fields and use as a join key rather than a model feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.iqr","stats.std","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","stats.zero_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This is a county- or tract-level poverty rate expressed as a percentage, ranging from 1.6 to 66.32 with a median of 13.55 and IQR of 7.75. The distribution is right-skewed (skew 2.10, kurtosis 6.89) with 137 high outliers (4.25%) reflecting pockets of severe poverty well above the typical 10\u201318% band. No nulls or zeros, and 1719 unique values across 3222 rows suggest one record per geographic unit.","role":"feature","scope":"column","target":"poverty_rate","treatment":"Apply a log or sqrt transform before regression to tame the right skew."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":1429,"prompt_tokens":4396,"total_tokens":5825}},"language_counts":{},"meta":{"generated_at":"2026-05-01T16:54:09+00:00","mode":"full","row_count":3222,"sampled_rows":3222,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/cache/healthcare_data/poverty_data_20260121.parquet"},"notes":[],"saturn_version":"0.2.0","schema":{"county_name":"text","fips":"text","poverty_rate":"numeric"}}
