{"columns":[{"alerts":[],"column":"id","extras":{"histogram":{"counts":[743,469,305,306,268,202,198,176,119,81,89,146,254,215,191,105,77,85,98,91,113,90,90,84,71,80,10,33,70,92,18,78,47,65,42,8,33,45,50,74],"edges":[60.0,2051.275,4042.55,6033.825000000001,8025.1,10016.375,12007.650000000001,13998.925000000001,15990.2,17981.475000000002,19972.75,21964.025,23955.300000000003,25946.575,27937.850000000002,29929.125,31920.4,33911.675,35902.950000000004,37894.225,39885.5,41876.775,43868.05,45859.325000000004,47850.600000000006,49841.875,51833.15,53824.425,55815.700000000004,57806.975000000006,59798.25,61789.525,63780.8,65772.075,67763.35,69754.625,71745.90000000001,73737.175,75728.45,77719.725,79711.0]},"sample":[35293.0,39620.0,37094.0,3296.0,8679.0,75309.0,26604.0,1255.0,2917.0,1261.0,78863.0,55195.0,41981.0,36623.0,1028.0,1606.0,11549.0,47536.0,24818.0,3032.0,36178.0,62851.0,37010.0,62595.0,802.0,166.0,63033.0,1664.0,147.0,2960.0,69315.0,3798.0,2141.0,1665.0,11519.0,1794.0,6961.0,8345.0,8487.0,2182.0,27844.0,6854.0,1742.0,13287.0,22500.0,4886.0,8059.0,3421.0,2919.0,5160.0,2248.0,36070.0,27983.0,79711.0,2844.0,3027.0,6824.0,2861.0,5637.0,1792.0,6971.0,25009.0,14338.0,6706.0,13419.0,16722.0,23974.0,10980.0,4649.0,7676.0,2309.0,348.0,15273.0,23065.0,12802.0,880.0,6164.0,6782.0,7225.0,12904.0,2667.0,513.0,1368.0,6755.0,1370.0,1372.0,32905.0,76534.0,18333.0,28720.0,27076.0,13313.0,41503.0,27587.0,45137.0,18065.0,37203.0,721.0,38893.0,35940.0,246.0,42978.0,6992.0,1030.0,42726.0,33764.0,5369.0,8935.0,7627.0,43381.0,43162.0,19232.0,23570.0,19421.0,14525.0,7004.0,26822.0,8454.0,56061.0,18377.0,9465.0,78583.0,4987.0,28386.0,15416.0,24693.0,13768.0,8460.0,2062.0,3085.0,71863.0,65924.0,57765.0,4741.0,42150.0,30367.0,18059.0,2805.0,35427.0,40842.0,10879.0,29448.0,11295.0,15019.0,40314.0,37522.0,43348.0,23418.0,37697.0,49302.0,27042.0,3472.0,28533.0,24354.0,27374.0,13070.0,42794.0,50965.0,50502.0,57303.0,42140.0,19910.0,23537.0,292.0,2464.0,29674.0,29891.0,2470.0,15374.0,14845.0,44111.0,35883.0,6394.0,76464.0,5532.0,1311.0,25860.0,26790.0,2363.0,10765.0,2368.0,26605.0,5678.0,2425.0,3269.0,24413.0,1459.0,78973.0,75126.0,25137.0,7651.0,232.0,30789.0,23929.0,32924.0,908.0,29675.0,55598.0,44437.0,46534.0,58484.0,31860.0,46401.0,22802.0,35387.0,14828.0,21271.0,43519.0,26544.0,30090.0,30089.0,35868.0,34990.0,43588.0,7275.0,29409.0,57401.0,31025.0,17939.0,22973.0,2554.0,28023.0,2953.0,8351.0,77435.0,14493.0,1049.0,27991.0,18221.0,41411.0,23367.0,19655.0,59346.0,12122.0,27167.0,6775.0,42742.0,40087.0,6194.0,48339.0,16294.0,48530.0,5085.0,15610.0,1135.0,1136.0,14237.0,4116.0,4421.0,28080.0,18278.0,23836.0,65664.0,1530.0,15615.0,5909.0,48354.0,1428.0,63728.0,459.0,66051.0,16486.0,12825.0,45098.0,22192.0,28886.0,26460.0,3399.0,4986.0,1451.0,1453.0,43285.0,23856.0,5047.0,22561.0,12709.0,68896.0,5326.0,15144.0,11841.0,16540.0,20363.0,1601.0,9750.0,9212.0,3336.0,78751.0,77563.0,4201.0,26011.0,65305.0,12669.0,63981.0,51962.0,41232.0,30548.0,4952.0,4731.0,10925.0,27613.0,6330.0,4960.0,33979.0,10863.0,9537.0,6313.0,23980.0,4972.0,58458.0,10421.0,5267.0,23637.0,63286.0,27206.0,59235.0,24512.0,23733.0,24967.0,4532.0,26226.0,4081.0,71794.0,56829.0,6644.0,23628.0,26005.0,650.0,14841.0,659.0,9276.0,2900.0,1720.0,11886.0,412.0,666.0,9534.0,9109.0,8680.0,3050.0,65789.0,674.0,683.0,684.0,15067.0,116.0,25907.0,15746.0,64019.0,7148.0,856.0,2932.0,3122.0,3551.0,3565.0,3002.0,26888.0,48013.0,3572.0,8000.0,16734.0,789.0,13673.0,24235.0,78786.0,1445.0,29455.0,7215.0,29794.0,6478.0,10220.0,7326.0,10740.0,6418.0,77199.0,58593.0,20231.0,6445.0,11682.0,10783.0,29244.0,6461.0,77793.0,30430.0,1632.0,30570.0,638.0,27768.0,50045.0,26473.0,63243.0,40420.0,15627.0,7604.0,9385.0,6941.0,12314.0,41621.0,9036.0,10273.0,14376.0,10157.0,8547.0,39137.0,4143.0,57754.0,7670.0,6007.0,10591.0,9315.0,71803.0,16470.0,1949.0,396.0,14732.0,18623.0,17730.0,55306.0,36591.0,36072.0,30462.0,27682.0,79672.0,1109.0,6058.0,10091.0,1723.0,66120.0,20923.0,42448.0,9373.0,57781.0,945.0,51753.0,14350.0,70737.0,5136.0,9175.0,47107.0,24772.0,4737.0,24714.0,43823.0,45423.0,48777.0,30459.0,15135.0,13487.0,9392.0,23300.0,63900.0,12655.0,1685.0,24310.0,72287.0,11930.0,59331.0,8456.0,38224.0,391.0,1671.0,39858.0,10354.0,20435.0,1917.0,62354.0,63451.0,17539.0,12997.0,33908.0,47225.0,34043.0,25989.0,23762.0,16204.0,20863.0,50469.0,20101.0,19841.0,79117.0,75925.0,43211.0,43915.0,50982.0,41062.0,2804.0,25470.0,45418.0,59659.0,19472.0,1240.0,1244.0,798.0,43994.0,2448.0,17142.0,2423.0,15141.0,15343.0,1486.0,1293.0]},"kind":"numeric","n":5411,"n_null":0,"n_unique":5411,"null_rate":0.0,"stats":{"iqr":31464.0,"kurtosis":-0.15101399407349625,"max":79711.0,"mean":23288.121604139717,"median":16598.0,"min":60.0,"n_outliers":0,"outlier_rate":0.0,"q1":4898.5,"q3":36362.5,"skew":0.9108865161140566,"std":21383.079149017754,"zero_rate":0.0}},{"alerts":[],"column":"state","extras":{"singletons":0,"top_values":[["Washington",631],["California",431],["Ohio",317],["Florida",314],["Oregon",253],["Illinois",239],["Texas",238],["Michigan",217],["Missouri",161],["Georgia",135],["Colorado",128],["Pennsylvania",125],["British Columbia",122],["New York",116],["Kentucky",115],["Arkansas",104],["Tennessee",104],["West Virginia",104],["Oklahoma",101],["Idaho",99]]},"kind":"categorical","n":5411,"n_null":0,"n_unique":53,"null_rate":0.0,"stats":{"cardinality":53,"entropy":5.025141117002036,"entropy_ratio":0.8773063726816794,"top_rate":0.11661430419515802,"top_value":"Washington"}},{"alerts":[],"column":"state_code","extras":{"singletons":0,"top_values":[["wa",631],["ca",431],["oh",317],["fl",314],["or",253],["il",239],["tx",238],["mi",217],["mo",161],["ga",135],["co",128],["pa",125],["ca-bc",122],["ny",116],["ky",115],["ar",104],["tn",104],["wv",104],["ok",101],["id",99]]},"kind":"categorical","n":5411,"n_null":0,"n_unique":53,"null_rate":0.0,"stats":{"cardinality":53,"entropy":5.025141117002036,"entropy_ratio":0.8773063726816794,"top_rate":0.11661430419515802,"top_value":"wa"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"81.1% duplicate strings"}],"column":"county","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[338,0,0,0,0,28,457,0,640,0,1110,0,802,916,0,608,0,301,0,62,94,0,5,0,24,0,16,3,0,3,0,0,0,3,0,0,0,0,0,1],"edges":[0.0,0.575,1.15,1.7249999999999999,2.3,2.875,3.4499999999999997,4.0249999999999995,4.6,5.175,5.75,6.324999999999999,6.8999999999999995,7.475,8.049999999999999,8.625,9.2,9.774999999999999,10.35,10.924999999999999,11.5,12.075,12.649999999999999,13.225,13.799999999999999,14.374999999999998,14.95,15.524999999999999,16.099999999999998,16.674999999999997,17.25,17.825,18.4,18.974999999999998,19.549999999999997,20.125,20.7,21.275,21.849999999999998,22.424999999999997,23.0]},"near_unique":false,"sample":["Bibb","Houston","Lewis","Cowlitz","Montmorency","","Cass","Skamania","Ferry","Navajo","Portage","Madison","Edgar","Clay","Logan","Dade","Los+Angeles","King","","Chippewa","Saline","Yavapai","San+Juan","Mono","Jefferson","Palo+Pinto","Montgomery","Hernando","El+Dorado","","Grant","","Josephine","Berkshire","Lee","","Pendleton","Passaic","St.+Louis","Essex","Clallam","Barbour","Cook","Yakima","Polk","","Jackson","Essex","Park","Pierce"],"top_values":[["",338],["Pierce",80],["Jefferson",57],["Lewis",55],["Washington",52],["Snohomish",51],["Humboldt",50],["Skamania",49],["Jackson",48],["Polk",42],["King",41],["Marion",39],["Madison",38],["Montgomery",38],["Grays+Harbor",37],["Lake",36],["Tuolumne",36],["Coconino",33],["Siskiyou",31],["Mason",31]],"top_words":[["pierce",80],["jefferson",57],["lewis",55],["washington",52],["snohomish",51],["humboldt",50],["skamania",49],["jackson",48],["polk",42],["king",41],["marion",39],["madison",38],["montgomery",38],["grays+harbor",37],["lake",36],["tuolumne",36],["coconino",33],["siskiyou",31],["mason",31],["warren",30],["monroe",28],["shasta",28],["douglas",28],["clackamas",28],["el+dorado",26]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5411,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":5411,"n_null":0,"n_unique":1022,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.8111254851228978,"emoji_rate":0.0,"len_max":23,"len_mean":6.620957309184994,"len_median":7.0,"len_min":0,"len_p95":10.0,"n_duplicates":4389,"n_empty":338,"one_word_rate":1.0,"readability_flesch_mean":16.89670000000003,"url_rate":0.0,"vocab_size":1020,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"url_heavy","level":"info","message":"100.0% rows contain a URL"}],"column":"url","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[11,0,0,0,0,0,0,0,0,0,0,0,0,288,0,0,0,0,0,0,0,0,0,0,0,0,1789,0,0,0,0,0,0,0,0,0,0,0,0,3323],"edges":[46.0,46.075,46.15,46.225,46.3,46.375,46.45,46.525,46.6,46.675,46.75,46.825,46.9,46.975,47.05,47.125,47.2,47.275,47.35,47.425,47.5,47.575,47.65,47.725,47.8,47.875,47.95,48.025,48.1,48.175,48.25,48.325,48.4,48.475,48.55,48.625,48.7,48.775,48.85,48.925,49.0]},"near_unique":true,"sample":["https://www.bfro.net/GDB/show_report.asp?id=21714","https://www.bfro.net/GDB/show_report.asp?id=7604","https://www.bfro.net/GDB/show_report.asp?id=12803","https://www.bfro.net/GDB/show_report.asp?id=55658","https://www.bfro.net/GDB/show_report.asp?id=27009","https://www.bfro.net/GDB/show_report.asp?id=43994","https://www.bfro.net/GDB/show_report.asp?id=14942","https://www.bfro.net/GDB/show_report.asp?id=21473","https://www.bfro.net/GDB/show_report.asp?id=25722","https://www.bfro.net/GDB/show_report.asp?id=29358","https://www.bfro.net/GDB/show_report.asp?id=4969","https://www.bfro.net/GDB/show_report.asp?id=454","https://www.bfro.net/GDB/show_report.asp?id=33911","https://www.bfro.net/GDB/show_report.asp?id=42692","https://www.bfro.net/GDB/show_report.asp?id=30203","https://www.bfro.net/GDB/show_report.asp?id=1719","https://www.bfro.net/GDB/show_report.asp?id=14953","https://www.bfro.net/GDB/show_report.asp?id=26403","https://www.bfro.net/GDB/show_report.asp?id=71929","https://www.bfro.net/GDB/show_report.asp?id=25451","https://www.bfro.net/GDB/show_report.asp?id=13070","https://www.bfro.net/GDB/show_report.asp?id=12266","https://www.bfro.net/GDB/show_report.asp?id=32905","https://www.bfro.net/GDB/show_report.asp?id=65849","https://www.bfro.net/GDB/show_report.asp?id=1134","https://www.bfro.net/GDB/show_report.asp?id=19666","https://www.bfro.net/GDB/show_report.asp?id=15492","https://www.bfro.net/GDB/show_report.asp?id=22074","https://www.bfro.net/GDB/show_report.asp?id=6639","https://www.bfro.net/GDB/show_report.asp?id=20758","https://www.bfro.net/GDB/show_report.asp?id=7687","https://www.bfro.net/GDB/show_report.asp?id=1294","https://www.bfro.net/GDB/show_report.asp?id=6655","https://www.bfro.net/GDB/show_report.asp?id=49697","https://www.bfro.net/GDB/show_report.asp?id=27323","https://www.bfro.net/GDB/show_report.asp?id=77435","https://www.bfro.net/GDB/show_report.asp?id=13122","https://www.bfro.net/GDB/show_report.asp?id=10918","https://www.bfro.net/GDB/show_report.asp?id=35281","https://www.bfro.net/GDB/show_report.asp?id=10289","https://www.bfro.net/GDB/show_report.asp?id=10091","https://www.bfro.net/GDB/show_report.asp?id=13141","https://www.bfro.net/GDB/show_report.asp?id=39851","https://www.bfro.net/GDB/show_report.asp?id=1689","https://www.bfro.net/GDB/show_report.asp?id=45418","https://www.bfro.net/GDB/show_report.asp?id=12100","https://www.bfro.net/GDB/show_report.asp?id=38440","https://www.bfro.net/GDB/show_report.asp?id=6631","https://www.bfro.net/GDB/show_report.asp?id=35596","https://www.bfro.net/GDB/show_report.asp?id=1685"],"top_values":[],"top_words":[["https://www.bfro.net/gdb/show_report.asp?id=75577",1],["https://www.bfro.net/gdb/show_report.asp?id=71896",1],["https://www.bfro.net/gdb/show_report.asp?id=67423",1],["https://www.bfro.net/gdb/show_report.asp?id=1783",1],["https://www.bfro.net/gdb/show_report.asp?id=26513",1],["https://www.bfro.net/gdb/show_report.asp?id=27067",1],["https://www.bfro.net/gdb/show_report.asp?id=21714",1],["https://www.bfro.net/gdb/show_report.asp?id=43963",1],["https://www.bfro.net/gdb/show_report.asp?id=50178",1],["https://www.bfro.net/gdb/show_report.asp?id=8921",1],["https://www.bfro.net/gdb/show_report.asp?id=1830",1],["https://www.bfro.net/gdb/show_report.asp?id=45464",1],["https://www.bfro.net/gdb/show_report.asp?id=42939",1],["https://www.bfro.net/gdb/show_report.asp?id=26886",1],["https://www.bfro.net/gdb/show_report.asp?id=49238",1],["https://www.bfro.net/gdb/show_report.asp?id=24451",1],["https://www.bfro.net/gdb/show_report.asp?id=43402",1],["https://www.bfro.net/gdb/show_report.asp?id=1907",1],["https://www.bfro.net/gdb/show_report.asp?id=42692",1],["https://www.bfro.net/gdb/show_report.asp?id=22969",1],["https://www.bfro.net/gdb/show_report.asp?id=273",1],["https://www.bfro.net/gdb/show_report.asp?id=47975",1],["https://www.bfro.net/gdb/show_report.asp?id=44386",1],["https://www.bfro.net/gdb/show_report.asp?id=27568",1],["https://www.bfro.net/gdb/show_report.asp?id=577",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5411,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":5411,"n_null":0,"n_unique":5411,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":49,"len_mean":48.55682868231381,"len_median":49.0,"len_min":46,"len_p95":49.0,"n_duplicates":0,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":-301.7799999999999,"url_rate":1.0,"vocab_size":5411,"word_mean":1.0,"word_median":1.0}},{"alerts":[],"column":"month","extras":{"singletons":10,"top_values":[["August",634],["October",632],["July",618],["September",515],["June",468],["November",458],["May",303],["April",259],["December",233],["January",228],["Summer",217],["March",201],["February",163],["Fall",129],["Spring",96],["Winter",57],["Late",6],["about",6],["mid",5],["or",5]]},"kind":"categorical","n":5411,"n_null":160,"n_unique":32,"null_rate":0.029569395675475882,"stats":{"cardinality":32,"entropy":3.8072052455185728,"entropy_ratio":0.7614410491037146,"top_rate":0.12073890687488098,"top_value":"August"}},{"alerts":[],"column":"year","extras":{"histogram":{"counts":[1,0,0,0,0,1,0,0,0,1,1,0,2,2,2,2,4,2,5,4,15,13,18,24,53,120,158,331,307,257,224,195,380,610,679,622,616,355,220,130],"edges":[1870.0,1873.875,1877.75,1881.625,1885.5,1889.375,1893.25,1897.125,1901.0,1904.875,1908.75,1912.625,1916.5,1920.375,1924.25,1928.125,1932.0,1935.875,1939.75,1943.625,1947.5,1951.375,1955.25,1959.125,1963.0,1966.875,1970.75,1974.625,1978.5,1982.375,1986.25,1990.125,1994.0,1997.875,2001.75,2005.625,2009.5,2013.375,2017.25,2021.125,2025.0]},"sample":[1978.0,2013.0,2007.0,1993.0,1986.0,2022.0,2009.0,1998.0,1995.0,1990.0,2025.0,2021.0,2014.0,2013.0,2000.0,1981.0,1995.0,1972.0,2014.0,2000.0,1994.0,1973.0,1978.0,2011.0,2001.0,1977.0,1968.0,1983.0,2000.0,1995.0,1968.0,2003.0,2000.0,1999.0,1995.0,1992.0,1965.0,1961.0,1991.0,1980.0,1972.0,1989.0,2002.0,1992.0,1963.0,1978.0,1974.0,1984.0,2003.0,2003.0,1975.0,2019.0,1970.0,1970.0,1987.0,2002.0,1992.0,1998.0,1984.0,1966.0,1986.0,1980.0,1962.0,1994.0,2003.0,2007.0,2006.0,2006.0,2006.0,2001.0,1983.0,1963.0,2020.0,1971.0,2005.0,2003.0,2006.0,1987.0,2014.0,2008.0,2001.0,2005.0,1987.0,1991.0,2000.0,2004.0,1996.0,2024.0,1990.0,2010.0,2012.0,2015.0,1972.0,2006.0,2005.0,2006.0,1986.0,1997.0,2010.0,1998.0,1978.0,2018.0,1963.0,2001.0,2013.0,2012.0,1978.0,1985.0,1984.0,2010.0,2011.0,2005.0,2002.0,1999.0,1956.0,1993.0,2009.0,1985.0,1996.0,2013.0,1997.0,2018.0,1982.0,1983.0,2020.0,2006.0,1995.0,1995.0,1975.0,2021.0,2020.0,2017.0,1969.0,2008.0,1964.0,1998.0,1975.0,2012.0,1978.0,1975.0,1997.0,1984.0,2011.0,1983.0,2013.0,2012.0,1989.0,2008.0,1994.0,2017.0,2011.0,1977.0,2006.0,1975.0,1999.0,2009.0,2014.0,2010.0,1998.0,2014.0,2008.0,1970.0,1968.0,2004.0,2010.0,2009.0,1979.0,2000.0,1988.0,1985.0,1970.0,2012.0,2007.0,1970.0,1995.0,2014.0,1977.0,2018.0,1982.0,2014.0,1993.0,1973.0,1950.0,2012.0,2017.0,1980.0,2025.0,2016.0,2012.0,1999.0,2006.0,2007.0,1971.0,2008.0,2005.0,2016.0,1991.0,1965.0,2012.0,2014.0,1978.0,2006.0,1995.0,1986.0,1999.0,2009.0,2004.0,1983.0,2001.0,1950.0,1967.0,1992.0,2006.0,1993.0,1978.0,1977.0,2004.0,2001.0,2012.0,2022.0,1978.0,2010.0,2010.0,1978.0,2012.0,2007.0,2014.0,1997.0,2004.0,1982.0,1978.0,2002.0,2003.0,2015.0,1999.0,2016.0,2007.0,1961.0,1973.0,2019.0,2001.0,2012.0,1998.0,1983.0,2012.0,2018.0,1981.0,1974.0,2005.0,2001.0,1995.0,1952.0,1971.0,1969.0,1981.0,1989.0,1998.0,2015.0,2002.0,1996.0,1998.0,1985.0,2000.0,2002.0,1983.0,1969.0,2001.0,2006.0,1989.0,1969.0,1997.0,2003.0,2020.0,2009.0,2002.0,1999.0,2005.0,1965.0,1997.0,2024.0,2025.0,1999.0,2002.0,1994.0,2001.0,1976.0,2019.0,1979.0,2012.0,2002.0,1980.0,1981.0,2003.0,2021.0,1992.0,2017.0,2005.0,2004.0,2013.0,1974.0,2010.0,1978.0,2002.0,1986.0,2007.0,2001.0,1999.0,1995.0,2014.0,1942.0,2012.0,2012.0,2000.0,2020.0,2019.0,1996.0,1972.0,2011.0,1983.0,2018.0,1973.0,2008.0,2008.0,2004.0,1971.0,1989.0,1969.0,2012.0,1996.0,1963.0,1973.0,1994.0,1980.0,1968.0,1988.0,1996.0,1989.0,1995.0,1970.0,1994.0,1998.0,1997.0,1993.0,1976.0,2016.0,2015.0,2022.0,1984.0,1996.0,1973.0,1978.0,2010.0,1998.0,2021.0,2003.0,2007.0,1987.0,1986.0,2003.0,2008.0,2004.0,1970.0,2007.0,2000.0,1981.0,2000.0,2008.0,2003.0,1987.0,1986.0,2006.0,2002.0,1994.0,2012.0,1979.0,1968.0,2014.0,1981.0,2017.0,2015.0,2001.0,1992.0,1991.0,1996.0,1996.0,2017.0,2005.0,1977.0,1978.0,2003.0,2021.0,1992.0,2019.0,1982.0,2022.0,2004.0,1980.0,1983.0,1990.0,2017.0,2021.0,1978.0,1996.0,1964.0,2005.0,2008.0,2021.0,2016.0,2004.0,1993.0,2010.0,1957.0,2003.0,2004.0,2004.0,2003.0,2009.0,2007.0,2010.0,2002.0,2016.0,1999.0,2012.0,2003.0,1973.0,2011.0,1998.0,2014.0,2006.0,2000.0,1998.0,1998.0,2001.0,2012.0,1996.0,2006.0,1986.0,1993.0,2020.0,2018.0,2002.0,1996.0,1983.0,1977.0,1973.0,2009.0,2004.0,2002.0,1999.0,1975.0,1971.0,2021.0,1984.0,2018.0,2014.0,2007.0,2005.0,1995.0,1984.0,1970.0,2014.0,2009.0,2008.0,1983.0,2009.0,2015.0,2010.0,2004.0,2023.0,2000.0,2012.0,2013.0,1992.0,1999.0,2014.0,2021.0,1996.0,1980.0,2007.0,2000.0,1970.0,2012.0,2004.0,2001.0,1999.0,1998.0,1995.0,1995.0,1995.0,1986.0,1986.0,1983.0,1977.0,1973.0,1994.0,1983.0,2007.0,1990.0,1990.0,1995.0]},"kind":"numeric","n":5411,"n_null":57,"n_unique":99,"null_rate":0.010534097209388284,"stats":{"iqr":22.0,"kurtosis":1.996502176474011,"max":2025.0,"mean":1997.8276055285767,"median":2001.0,"min":1870.0,"n_outliers":49,"outlier_rate":0.009152035861038476,"q1":1987.0,"q3":2009.0,"skew":-0.9738071931846934,"std":15.785219399352227,"zero_rate":0.0}},{"alerts":[],"column":"classification","extras":{"singletons":0,"top_values":[["Class B",2722],["Class A",2655],["Class C",34]]},"kind":"categorical","n":5411,"n_null":0,"n_unique":3,"null_rate":0.0,"stats":{"cardinality":3,"entropy":1.0486006898694666,"entropy_ratio":0.6615933748542029,"top_rate":0.5030493439290334,"top_value":"Class B"}},{"alerts":[{"code":"near_unique","level":"info","message":"99.9% of rows are unique strings"}],"column":"description","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[2,4,21,56,108,185,376,551,525,568,692,495,486,369,330,196,135,99,74,42,26,23,10,9,6,4,6,2,1,2,3,0,0,2,1,0,0,0,0,2],"edges":[10.0,15.275,20.55,25.825000000000003,31.1,36.375,41.650000000000006,46.925000000000004,52.2,57.475,62.75,68.025,73.30000000000001,78.575,83.85000000000001,89.125,94.4,99.67500000000001,104.95,110.22500000000001,115.5,120.775,126.05000000000001,131.325,136.60000000000002,141.875,147.15,152.425,157.70000000000002,162.97500000000002,168.25,173.525,178.8,184.07500000000002,189.35000000000002,194.625,199.9,205.175,210.45000000000002,215.72500000000002,221.0]},"near_unique":true,"sample":["Rescue workers describes possible stalking on the Cahaba River outside Montevallo","Possible bigfoot activity near Walker County line.","Hikers off Lewis River Trail find large footprint east of Cougar","Hunters on bikes have close encounter with a sasquatch near Randle","Woman recalls daylight sighting while driving and a possible incident at a home east of Gaylord","Possible sighting near Bowser on Vancouver Island","County workers find possible footprints near Bena","Man and girlfriend, camping, hear loud footsteps and tree knocking near Cispus, Washington","Possible reoccurring activity at a hunting spot near Republic","Brief daylight sighting within the city limits of Show Low","Silhouette seen protruding above brushline near Mogadore Reservoir.","Man recalls incident as a child in a swampy area near Cazenovia","Possible ongoing activity described and knocks recorded at a rural home near Paris","Daytime road crossing seen near Ashland","Nighttime sighting by motorists along I-55 near Lincoln","Possible collision with vehicle outside Homestead","Possible intimidation in the late afternoon reported by hikers in the Big Tujunga Canyon area.","Man sees large, hair-covered figure while riding on train near the Cascade Tunnel","Likely road crossing sighting of a sasquatch 20 miles southeast of Moncton, New Brunswick, Canada","Man witnesses the sillouette of a tall creature while boiling sap near Sault Ste. Marie","Youth has pre-dawn encounter on the way to deer stand near Mitchellville","Camping family glimpses a grey animal twice in three days","Hiker has a possible daytime sighting near Crater Lake","Possible sighting at Mono Lake at Sunrise","Three hunters see strange figure walking towards them in the pre-dawn woods.","Hunter hears very loud scream at short range near Brazos River","Road-crossing sighting by motorist on Hwy 220 north of Candor","Possible early morning encounter by hunters in the Green Swamp","Couple have night sighting near Lake Tahoe","Strange, tall creature seen crossing the road at Kennedy Lake","Lone camper hears vocalization","Brushfire fighters find and photograph large track in remote area on the northside of Lac Seul","Couple hears repetitive calls near Oregon Caves N. M","Daytime sighting while traveling on US-7 North of Williamstown","Possible harrassment at a secluded cabin near Zachariah","EXPEDITION REPORT for incidents on Spring 2024 MN trip","Possible repeat approaches outside Circleville","Hunter has early morning encounter 8 miles north of Riverdale","Unknown nighttime visitor at a campsite on Lake Jeannette","Two people in canoe see creature on shoreline","Series of vocalizations around the town of Joyce","Possible vocalizations heard by camper near Tygart Valley River","Motorists have possible nighttime sighting in Green Belt Forest Preserve","A tall black creature covered with hair and very muscular was seen walking quickly across a clearing","Campers hear possible vocalization and have trailer shaken at Interstate State Park","Possible rock-knocking heard by hikers near Pitt Lake","Woman driving at night hits a man-like animal near Mayetta","Essex County, April 1978, Encounter with Creature","Early evening sighting by two women hiking in Bailey","Skydivers witness creature while flying over mountain"],"top_values":[],"top_words":[["near",2283],["a",1937],["of",1503],["sighting",1436],["in",1286],["possible",1117],["by",1013],["the",972],["and",899],["on",855],["at",739],["encounter",521],["while",491],["has",483],["night",437],["outside",422],["lake",421],["creature",414],["daylight",410],["two",410],["vocalizations",398],["road",373],["heard",357],["man",344],["hunter",339]],"vocab_skipped":null,"word_histogram":{"counts":[17,62,429,476,613,1292,620,509,710,220,258,70,40,40,20,10,7,8,2,2,2,1,0,0,1,0,0,0,1,1],"edges":[2.0,3.3666666666666667,4.733333333333333,6.1,7.466666666666667,8.833333333333334,10.2,11.566666666666666,12.933333333333334,14.3,15.666666666666668,17.03333333333333,18.4,19.766666666666666,21.133333333333333,22.5,23.866666666666667,25.233333333333334,26.6,27.96666666666667,29.333333333333336,30.7,32.06666666666666,33.43333333333334,34.8,36.166666666666664,37.53333333333333,38.9,40.266666666666666,41.63333333333333,43.0]}},"kind":"text","n":5411,"n_null":0,"n_unique":5407,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.00018480872297172427,"duplicate_rate":0.0007392348918868971,"emoji_rate":0.0,"len_max":221,"len_mean":67.04213638883755,"len_median":65.0,"len_min":10,"len_p95":101.5,"n_duplicates":4,"n_empty":0,"one_word_rate":0.0,"readability_flesch_mean":55.70520615200523,"url_rate":0.0,"vocab_size":7169,"word_mean":10.620772500462023,"word_median":10.0}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["state.top_values","county.top_values","year.stats","month.top_values","classification.top_values","row_count","county.stats.n_empty"],"featured_charts":[{"caption":"Top reporting states \u2014 note Washington, California, and Ohio lead by a wide margin.","column":"state","kind":"bar"},{"caption":"Class A and Class B are nearly even while Class C is negligible.","column":"classification","kind":"donut"},{"caption":"Reports skew toward recent decades, with a long thin tail back to 1870.","column":"year","kind":"histogram"},{"caption":"Sightings cluster in summer and early fall, peaking in August and October.","column":"month","kind":"bar"},{"caption":"Most-named counties, led by Pierce; watch for the 338 missing county entries.","column":"county","kind":"bar"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset catalogs 5,411 Bigfoot sighting reports from the BFRO database, with fields covering location (state, county), timing (year, month), a classification grade, a short description, and a source URL. Geographically, sightings concentrate heavily in Washington (631), California (431), and Ohio (317), and the most common county is Pierce \u2014 worth a closer look as the data skews toward the Pacific Northwest. Temporally, the year distribution is left-skewed (mean 1997, median 2001, range 1870\u20132025), so most reports come from the late 1990s onward, and August/October/July dominate the month field, hinting at a warm-season reporting pattern. Classification is nearly a coin-flip between Class A (2,655) and Class B (2,722), with Class C almost absent (34) \u2014 that imbalance is something to flag before any modeling. Note also that 338 county values are empty even though state coverage is complete.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew"],"model":"anthropic:claude-opus-4-7","narrative":"This column is almost certainly a row identifier: all 5411 values are unique with no nulls, spanning 60 to 79711. The wide range relative to the row count suggests sparse, non-sequential IDs (likely assigned from a larger source system) rather than a dense 1..N index. Skew of 0.91 and median 16598 vs mean 23288 are expected artifacts of ID allocation, not meaningful distribution signals.","role":"identifier","scope":"column","target":"id","treatment":"Exclude from modelling; retain as a join key."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a US state field with 53 distinct values across 5411 rows and no nulls, suggesting it includes the 50 states plus a few extras like DC or territories. Distribution is fairly even (entropy ratio 0.877), but Washington leads at 11.66% (631 rows) \u2014 unusually high for a national sample and ahead of California (431), hinting at geographic bias toward the Pacific Northwest.","role":"feature","scope":"column","target":"state","treatment":"One-hot or target-encode; consider grouping the long tail and noting the Washington over-representation."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds US state codes as two-letter lowercase abbreviations, with 53 distinct values across 5411 rows and no nulls \u2014 slightly more than the 50 states, suggesting territories or DC are included. Distribution is broad (entropy ratio 0.88) but tilts toward Washington (wa, 11.7%) and California (ca, 431), which is unusual since wa outranks ca despite California's larger population.","role":"feature","scope":"column","target":"state_code","treatment":"Use as a categorical feature; one-hot or target-encode for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_empty","stats.one_word_rate","stats.word_mean","stats.len_max","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Single-word US county names (e.g., Pierce, Jefferson, Lewis, Snohomish, Skamania) acting as a geographic categorical feature. Heavy duplication is expected for this kind of field (duplicate_rate 0.81, 1022 unique values across 5411 rows), but 338 empty strings are recorded as non-null and should be treated as missing. The county mix (Snohomish, Skamania, Pierce, King) skews toward Washington/Pacific Northwest, with some overlap names like Jefferson and Jackson appearing in many states.","role":"feature","scope":"column","target":"county","treatment":"Convert empty strings to nulls and encode as a categorical (target/frequency encode given ~1k levels)."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.url_rate","stats.one_word_rate","stats.duplicate_rate","stats.len_min","stats.len_max","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds a unique BFRO report URL for each of the 5411 rows, all following the pattern https://www.bfro.net/gdb/show_report.asp?id=<n>. Every value is distinct (n_unique=5411, duplicate_rate=0.0), non-null, and url_rate is 1.0, so it functions as a per-row record locator rather than a feature. Lengths are tightly bound between 46 and 49 characters, consistent with only the numeric id varying.","role":"identifier","scope":"column","target":"url","treatment":"Keep as a row-level link for traceability; drop from modelling or extract the trailing id as a foreign key."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","stats.cardinality","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column captures the month name of an event, with August (634), October (632), and July (618) leading \u2014 consistent with a summer/autumn-skewed seasonal pattern. Cardinality is 32, far above the expected 12, so there are 20 extra non-month tokens polluting the field that need investigation. Null rate is 2.96% and entropy ratio is 0.76, indicating reasonably spread but not uniform distribution.","role":"feature","scope":"column","target":"month","treatment":"Normalize to the 12 canonical months, then one-hot or cyclically encode."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","n_unique","median","q1","q3","skew","n_outliers","outlier_rate","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Year of record, ranging from 1870 to 2025 across 99 distinct values with a median of 2001 and IQR spanning 1987-2009. The distribution is left-skewed (skew -0.97) with 49 outliers (0.9%) on the early-year tail, and 1.05% of rows are null.","role":"timestamp","scope":"column","target":"year","treatment":"Treat as a temporal feature; consider bucketing by decade or clipping pre-1970 outliers before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A three-level categorical label (Class A, B, C) with no nulls across 5411 rows. The distribution is essentially binary in practice: Class B (50.3%) and Class A are nearly tied, while Class C appears only 34 times, making it a rare class that will be hard to model or evaluate.","role":"label","scope":"column","target":"classification","treatment":"One-hot or ordinal encode; consider stratified splits or merging Class C given its rarity."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.len_mean","stats.len_median","stats.len_p95","stats.word_mean","stats.vocab_size","stats.duplicate_rate","stats.boilerplate_rate","stats.readability_flesch_mean","top_words","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Short free-text descriptions, almost certainly sighting summaries: 5407 of 5411 values are unique with a mean length of 67 characters and ~10.6 words. The vocabulary of 7169 tokens is dominated by 'near', 'sighting', and 'possible', suggesting templated phrasings about location-based observations. Duplicates and boilerplate are negligible (4 dupes, boilerplate_rate 0.00018), and Flesch ~55.7 indicates fairly readable prose with no URLs or emoji.","role":"free_text","scope":"column","target":"description","treatment":"Tokenize and embed (or extract entities like species/location) before modelling; do not use as a key."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":3008,"prompt_tokens":11812,"total_tokens":14820}},"language_counts":{},"meta":{"generated_at":"2026-05-01T18:06:57+00:00","mode":"full","row_count":5411,"sampled_rows":5411,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/wild/bigfoot_sightings.json"},"notes":[],"saturn_version":"0.2.0","schema":{"classification":"categorical","county":"text","description":"text","id":"numeric","month":"categorical","state":"categorical","state_code":"categorical","url":"text","year":"numeric"}}
