{"attributions":[{"component":"fastText lid.176 language identification model","license":"CC-BY-SA-3.0","note":"Language counts in this report were produced with the fastText lid.176 model, licensed CC-BY-SA-3.0. This report is a derivative work and carries the same license for those figures.","url":"https://fasttext.cc/docs/en/language-identification.html"}],"columns":[{"alerts":[{"code":"high_skew","level":"info","message":"skew=-2.84"},{"code":"outliers","level":"warn","message":"9.4% rows beyond 1.5 IQR"}],"column":"latitude","extras":{"histogram":{"counts":[7090,1218,4088,9707,4,3,1,20,72,110,287,726,991,714,902,581,297,341,603,690,435,1927,1608,1738,6214,5180,20824,47917,55501,77688,45229,28613,24054,7237,1480,490,92,86,9,3],"edges":[-87.36667,-82.97000325,-78.5733365,-74.17666975,-69.780003,-65.38333625,-60.986669500000005,-56.590002750000004,-52.193336,-47.79666925,-43.4000025,-39.003335750000005,-34.606669000000004,-30.210002250000002,-25.813335500000008,-21.41666875,-17.020002000000005,-12.62333525000001,-8.226668500000002,-3.830001750000008,0.5666650000000004,4.963331749999995,9.359998499999989,13.756665249999998,18.153331999999992,22.549998749999986,26.946665499999995,31.34333224999999,35.73999899999998,40.13666574999999,44.5333325,48.92999924999998,53.32666599999999,57.72333275,62.11999949999998,66.51666624999999,70.913333,75.30999974999997,79.70666649999998,84.10333324999999,88.5]},"sample":[-76.67555,-76.71667,-76.71667,-72.0,-31.61667,27.06667,26.94167,19.33265,18.24667,18.9942,18.16333,19.16667,-76.27743,-76.26796,-72.95236,-72.95,-72.983056,-72.775,-72.774444,28.56367,19.58107,-24.0,-20.9818,-85.63333,-84.0,-84.0,-84.0,-84.0,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,-71.5,61.2180556,31.2230556,35.8422222,36.2613889,34.3319444,33.4352778,33.4222222,34.4233333,34.1591667,33.1191667,33.9163889,35.6469444,33.5422222,37.4419444,33.8491667,32.7152778,37.775,37.775,37.9577778,39.1502778,34.0983333,39.6477778,40.0375,39.7383333,41.4
338889,39.7458333,26.5625,28.3858333,28.5555556,29.8944444,30.4380556,26.2125,27.9472222,28.0219444,30.7847222,31.4716667,47.3352778,39.1611111,42.1680556,40.0363889,41.6888889,39.8016667,36.9888889,37.0030556,38.9430556,41.7411111,41.7,41.2833333,42.3369444,42.1013889,44.6388889,44.6522222,43.4194444,46.4736111,37.3058333,38.3686111,37.4536111,37.2152778,38.45,36.1583333,34.2255556,40.8577778,35.0613889,42.2602778,42.6338889,40.7669444,40.8041667,42.2552778,44.6366667,40.4405556,34.3738889,34.8038889,36.145,36.5483333,30.2669444,32.9536111,29.7630556,32.8341667,30.5080556,29.7027778,36.6775,37.2708333,47.0344444,45.6388889,39.5105556,65.6298,44.3872,35.9907,51.0921,53.99,42.18,34.92,42.03,38.87,35.85,30.28,32.72,39.28,37.08,32.33,39.27,30.48,33.45,41.6,36.7,41.87,40.88,30.8,32.52,45.12,36.83,31.58,30.18,44.8,37.92,32.72,35.03,35.82,31.42,33.5,35.83,36.9,37.02,33.0,40.37,40.08,32.53,33.77,38.67,27.42,33.5,38.53,39.32,44.88,31.2,48.15,45.75,39.3,42.72,28.92,34.73,32.95,32.63,29.67,38.2,35.22,39.28,39.73,27.63,42.0,45.32,41.1,38.3,33.27,41.03,35.53,36.32,42.92,31.92,37.69,37.24,34.14,42.84,26.37,39.54,34.9934,34.8564,37.6134,39.2823,30.4829,42.6032,35.2279,37.4504,33.9298,39.5671,38.1657,39.8176,31.2173,39.7119,36.8151,38.9509,29.9611,31.1255,32.7458,29.5354,36.67,34.4535,47.1,35.47,44.911,41.766,40.1254,43.1136,30.2955,41.41,32.4898,40.422,41.7124,41.7762,34.461,32.6733,33.607,41.463,64.3113181,35.1413105,14.271427,33.6535742,-41.3768771,-20.2796977,43.250406,26.4260649,9.6591506,14.7742361,-35.856539,39.7556217,8.79985,8.4,31.1,18.8,45.08,43.22,34.62,30.0,38.3,37.37,33.85,34.7811,43.2,34.2203,42.3319,33.945,46.1575,42.1682,45.6289443,54.1665643,46.1174365,50.1650821,49.6236214,43.2688165,-43.3878788,47.8608847,48.0129641,42.8073156,48.4260175,42.8002324,41.3578183,43.5490166,45.1622874,-37.1552482,47.6155536,47.6546568,39.346753,48.8158718,50.6397222,47.2573893,29.0216899,43.3807473,43.835209,47.2581975,51.3781177,-33.819432,38.7529364,49.4658253,47.7599626,40.86562
74,43.4033377,42.5034051,43.6639886,43.2694758,46.0398981,31.6371517,41.6476399,44.2488648,46.2891605,39.7505652,39.6914601,39.5625411,39.6615691,49.0043582,40.1101255,45.8188846,47.0231359,50.6883723,44.3220324,43.5773053,43.032608,43.4593333,46.1050331,42.9176763,43.0000568,45.8986399,42.7705696,37.9750457,45.4702632,-19.1453793,49.2474567,50.6177246,48.8767611,48.2292675,42.9726037,45.6139257,44.5484395,45.1905412,43.38957,41.7297384,44.481995,48.4179019,45.6113889,55.4831458,42.1175638,8.1564332,40.0425993,40.1332802,39.7670071,37.4361629,41.875057,44.3072505,59.6119817,35.6308513,64.7809483,46.1542873,44.3188699,47.1577618,42.2731879,46.9412275,54.3935743,41.2718137,31.222992,40.5849979,54.636085,54.4166285,53.1189427,53.5003666,57.677911,42.1313491,58.4978205,49.5668794,40.8197165,50.9836063,51.3734292,59.2070803,18.4440857,56.8285192,57.1331937,54.1461293,53.5553101,58.758591,48.9224879,10.3881094,46.2108232,9.5275836,9.2186988,43.9227353,8.1318777,45.4059872,8.247943,45.4875918,43.4864619,64.0057665,65.0432257,58.7168528,56.5603123,55.9687554,55.201469303413,50.627197806984,50.0464089,13.42458,19.207728,52.949404091342,41.605976,52.859514311024,32.763,32.63622,48.41311,30.053766,50.205730237353,39.658685,55.740502,45.804,43.975667,45.397,47.857505,47.80163,44.480156,44.33069,45.020941,44.126401,43.30208,43.0285728,41.88784,59.006634,52.23210188886,53.107692,42.3599,51.18178,41.823248,43.718,47.228889,53.999577501496,53.87378443,51.421152209625,57.248192176032,40.49164,50.2342939,51.422432244119,48.52345,37.867973,47.358696,51.6615132,46.8421,51.2013817,54.822762,51.80702,53.148641964017,55.071194558647,36.861,39.6163009,46.0005,51.75511,55.260022,54.18925,43.004887,56.458026261944,50.8147791124,51.761321902901,58.922323180882,43.242087,51.914345311409,52.274933999359,51.938268911804,24.34699,54.80856470453,47.1233,51.723522685911,51.24952,55.335417139,55.426931,55.564655433922,59.57014,51.805000711625,49.959215995681,51.851858866048,37.30833,29.17805,40.9168
9,41.86425,48.25206,41.89011,30.509,46.04722,42.4641163,40.2760019,41.1423205,30.2576735,48.156394,37.2271005,42.8396692,36.1140611,29.9196714,43.8066226]},"kind":"numeric","n":354770,"n_null":0,"n_unique":215964,"null_rate":0.0,"stats":{"iqr":12.845811099999999,"kurtosis":7.302105619332297,"max":88.5,"mean":32.66081797980598,"median":40.5983333,"min":-87.36667,"n_outliers":33355,"outlier_rate":0.09401865997688644,"q1":33.6888889,"q3":46.5347,"skew":-2.8404050745221947,"std":31.011251046171218,"zero_rate":0.0006370324435549793}},{"alerts":[],"column":"longitude","extras":{"histogram":{"counts":[90,969,1120,814,413,839,18752,8803,21820,47491,45346,24836,4804,485,608,503,76,376,2511,40337,29096,36101,12918,13238,6091,5213,4220,604,3575,777,745,1540,1434,1238,1806,1475,730,8482,3693,801],"edges":[-179.2833333,-170.3012499675,-161.31916663500002,-152.33708330250002,-143.35499997,-134.3729166375,-125.390833305,-116.4087499725,-107.42666664000001,-98.44458330750001,-89.46249997500001,-80.4804166425,-71.49833331,-62.51624997750001,-53.534166645,-44.5520833125,-35.569999980000006,-26.58791664750001,-17.605833315000012,-8.623749982500016,0.358333349999981,9.340416682500006,18.322500015000003,27.3045833475,36.286666679999996,45.26875001249999,54.25083334499999,63.232916677499986,72.21500001000001,81.19708334250001,90.179166675,99.1612500075,108.14333334,117.1254166725,126.10750000499999,135.0895833375,144.07166666999998,153.05375000249998,162.03583333499998,171.01791666749997,180.0]},"sample":[159.30823,159.33333,159.66667,26.0,118.03333,16.06667,16.566,54.79373,54.00188,54.18137,54.16,54.40333,156.45176,156.51378,160.50719,160.43333,75.229167,75.3181,75.321667,12.90467,56.47213,-69.0,22.9766,-68.7,168.0,168.0,168.0,168.0,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,35.66667,-149.9002778,-85.3905556,-90.7041667,-90.9711111,-92.9130556,-112.3575,-111.8219444,-118.4711111,-118.5002778,-117.0855556,-118.3516667,-117.8116667,-
117.7822222,-122.1419444,-118.3875,-117.1563889,-122.4183333,-122.4183333,-121.2897222,-123.2066667,-118.3258333,-104.9872222,-107.9125,-104.3227778,-73.1172222,-75.5469444,-81.9497222,-80.7422222,-82.4505556,-81.3147222,-84.2808333,-80.25,-82.4586111,-81.7330556,-83.56,-83.6469444,-116.8875,-89.4936111,-88.4280556,-88.9569444,-88.9811111,-89.6436111,-84.6,-88.2344444,-84.5441667,-70.5994444,-70.0277778,-70.1,-71.2097222,-72.5902778,-70.0161111,-84.1297222,-83.9508333,-93.8986111,-89.5180556,-93.7780556,-90.7947222,-93.2980556,-91.0083333,-81.1477778,-77.945,-74.4263889,-106.1908333,-73.81,-73.5541667,-72.9966667,-73.1694444,-73.9027778,-123.1047222,-79.9961111,-80.0736111,-81.2394444,-82.4169444,-82.5619444,-97.7427778,-96.89,-95.3630556,-97.2286111,-97.6786111,-96.7802778,-76.9227778,-79.9416667,-122.8219444,-122.6602778,-79.7986111,-165.2551,-129.5367,-96.803,-130.1497,-165.116,-104.42,-88.58,-94.53,-98.58,-95.23,-83.75,-102.4,-97.12,-92.07,-90.35,-95.38,-84.55,-99.85,-96.5,-88.45,-103.67,-97.93,-85.23,-92.92,-95.03,-101.27,-94.7,-81.75,-96.7,-95.17,-96.85,-89.4,-91.12,-87.43,-94.9,-86.43,-94.33,-98.57,-90.95,-98.1,-98.33,-90.28,-101.02,-86.45,-82.58,-96.7,-93.22,-83.25,-89.93,-90.0,-119.78,-105.17,-102.25,-75.78,-97.32,-76.73,-90.43,-100.75,-95.02,-84.85,-100.08,-85.48,-103.58,-81.98,-104.0,-122.57,-96.47,-85.97,-86.88,-112.08,-81.08,-86.77,-70.85,-84.55,-85.06,-99.89,-92.58,-90.51,-97.78,-110.74,-99.569,-87.0143,-99.3765,-90.4076,-93.2413,-95.3649,-86.3916,-97.6697,-78.2779,-89.6256,-90.218,-101.878,-83.9785,-97.7802,-95.3178,-86.6385,-90.1782,-92.5368,-84.4357,-96.2906,-86.59,-87.4978,-109.98,-101.57,-99.4527,-73.664,-101.5284,-89.6289,-89.3658,-89.55,-80.3151,-88.367,-88.3913,-104.2608,-84.3531,-87.819,-88.3313,-95.525,-20.3018075,36.7712227,99.8789096,135.9275713,174.8683817,-174.804115,14.1655607,-14.1561847,-82.7519414,120.249947,174.9403459,-74.0998869,167.7309,161.9,140.0,73.4,-88.08,-92.38,-99.35,-95.25,-89.83,-122.03,-84.01667,-80.1422,-71.55,-85.9602,
-96.1086,-80.7579,-116.0542,-77.6383,6.0449616,-2.2706575,0.3986545,7.6228557,5.5511139,-4.3996027,170.2058893,16.1689218,16.2295889,-8.4465523,16.339402,-89.6537974,1.9242375,18.0542246,21.8543014,142.5070023,15.9724972,16.1436756,27.8074534,21.1669624,19.4794444,17.9836936,-13.7124427,12.7483506,3.6075796,-2.4317254,7.7789737,150.0236098,-0.5053532,5.9441448,15.8022018,0.3472683,12.9598657,12.4926536,6.9094858,19.1162481,11.5135887,35.2847595,24.3558575,11.689217,13.8404895,2.7908267,2.5991071,2.583529,2.5676871,19.6519084,113.1276497,14.6779367,14.3353875,11.6419505,4.5382311,3.6686715,6.0978655,6.9217516,12.4860689,-0.7284984,-117.8465855,14.5013366,1.3038126,-92.7696662,-0.5160117,-169.8427298,19.8701464,-2.2526897,18.3406663,18.8653299,-1.9046125,13.8675666,33.7397858,13.7459124,19.5650611,-3.008975,15.2150105,15.9596961,11.1924167,-4.3944948,1.8342128,80.9968434,116.0107984,18.4892972,3.3425089,-84.1075364,0.747592,3.30025,60.0050203,139.8785621,-23.683403,10.1189654,4.5475999,9.2365798,1.7482676,17.5862843,-1.9230224,0.6495237,35.3544292,0.2206762,27.202939,29.4058462,32.1854612,32.2022263,32.1707671,44.7122511,36.7052967,129.9320695,-3.6371959,38.4774889,9.2798834,52.2697283,78.9280533,67.9335126,30.1308442,24.8524117,36.3166951,49.385963,9.5495049,-13.1559824,6.2626112,46.7770263,46.8361652,11.3449697,47.9295586,16.1083616,47.6225342,148.6136025,-7.9990971,-51.6349822,-52.3631326,54.6080805,54.2464777,31.8230519,-6.2116490046153,-3.7368392589961,12.3478425,103.7769,72.905026,-4.1611093287844,15.883583,-3.9523849004224,-94.982,-91.405026,9.83713,35.07986,-5.3622660094005,2.911975,12.185337,1.226,1.859667,4.327,-3.86957,-4.21685,2.561165,4.24077,4.266543,3.343097,-1.638693,-2.0495863,25.86295,5.574628,-3.4870030424271,13.824961,-8.0302,11.42165,2.176114,5.016,15.3475,-1.4507041998424,13.17432368,-1.1126137826782,-5.5105650457652,49.34908,12.4289706,-1.8476482577412,9.46204,32.493499,1.746164,6.4525852,6.826544,11.3232335,11.480487,21.24275,-6.252010530572,-1
.8699923973358,-111.6019,9.3328321,3.799,6.947409,14.77011,17.64828,-2.669294,-5.3948765167481,-1.5244370853,-2.2524990818808,-2.7404964850204,-1.583501,-5.022276342347,-3.4370189194806,-4.74840013876,124.16769,-2.0983433571433,-1.0458,-5.0535046506037,11.6285,-1.91326965813,13.712761,-5.3185979678267,16.25811,-10.015451423448,-6.276676413985,-2.9973670105362,-106.4917,-96.29222,-111.8038,-73.00099,-116.0969,-88.18031,-90.6763,-122.1914,-82.9567569,-79.8374649,-77.4621475,-88.1073229,-122.2444099,-80.4441454,-71.49148939999999,-115.170627,-95.35716459999999,-103.4278192]},"kind":"numeric","n":354770,"n_null":0,"n_unique":223129,"null_rate":0.0,"stats":{"iqr":104.81386012499999,"kurtosis":0.11649899879357895,"max":180.0,"mean":-31.75288824253706,"median":-42.65733525,"min":-179.2833333,"n_outliers":827,"outlier_rate":0.0023310877469910085,"q1":-92.08,"q3":12.733860125,"skew":0.7545307004061931,"std":72.10691945974176,"zero_rate":0.0}},{"alerts":[{"code":"multilingual","level":"info","message":"31 languages detected in sample"},{"code":"duplicates","level":"warn","message":"46.5% duplicate 
strings"}],"column":"name","extras":{"language_counts":{"__engine":"fasttext:4,815","ar":15,"az":6,"be":14,"ca":51,"ceb":5,"cs":12,"cy":8,"da":38,"de":230,"el":8,"en":3363,"es":156,"eu":23,"fi":7,"fr":279,"hr":5,"hu":24,"id":18,"it":236,"ja":6,"nl":30,"no":7,"pl":28,"pt":30,"ro":9,"ru":102,"sk":10,"sv":17,"tr":7,"uk":11},"language_sample_size":5000,"length_histogram":{"counts":[8769,61484,132248,49793,74096,19324,3592,1239,408,415,461,495,537,395,431,348,245,167,117,69,51,26,22,14,5,6,1,3,4,0,2,0,0,1,0,0,0,0,0,2],"edges":[1.0,6.85,12.7,18.549999999999997,24.4,30.25,36.099999999999994,41.949999999999996,47.8,53.65,59.5,65.35,71.19999999999999,77.05,82.89999999999999,88.75,94.6,100.44999999999999,106.3,112.14999999999999,118.0,123.85,129.7,135.54999999999998,141.39999999999998,147.25,153.1,158.95,164.79999999999998,170.64999999999998,176.5,182.35,188.2,194.04999999999998,199.89999999999998,205.75,211.6,217.45,223.29999999999998,229.14999999999998,235.0]},"near_unique":false,"sample":["Kainsaz","El Chaparral","Cleaven Dyke","Dolmen de Chams","Tornado in KS, 20","The Harrison Cemetery","Tornado in NC, 37","Mousseau-les-Bray 2","Dolmen de La Griutera","Grove Mountains 021502","Unnamed Cave","Tornado in PENNSYLVANIA, LANCASTER","Tornado in ID, 16","Acfer 134","Tornado in WI, 55","UFO Sighting - rolla, MO","Yamato 86125","Munarriko Landa Dolmen 1","Augusta State University","Tornado in MI, 26","Tornado in OK, 40","Grove Mountains 022485","UFO Sighting - new albany, IN","UFO Sighting - fort smith, AR","Gruta dos Pescadores","\u0412\u043e\u0440\u0430\u045e\u0448\u0447\u044b\u043d\u0430","Cueva L-70","UFO Sighting - asheville, NC","Queen Alexandra Range 99691","Report 12510: Vocalizations near Scenic interrupt a camper\u2019s quiet evening","Cova/Avenc Quim Solbas","cova des S\u00f2til","Busa da neve del Vallon Media","Tornado in TX, 48","Tornado in TX, 48","Tornado in FL, 12","Jemn\u00edky Menhir","Tornado in OHIO, RICHLAND","Tornado in IL, 17","Flash Flood in ARIZONA, 
YAVAPAI","Little Down Barrow Group","Martlesham Bowl Barrow 2","Tornado in GA, 13","Kurhan Go&#322;czewo","Loch Buie Stone Circle","Moore State Park","Tornado in CO, 8","Tornado in LA, 22","UFO Sighting - oglesby, IL","Magleby Nor Langdysse 1"],"top_values":[["Unnamed Cave",19962],["Tornado in TX, 48",9475],["Tornado in KS, 20",4545],["Tornado in OK, 40",4372],["Tornado in FL, 12",3733],["Tornado in NE, 31",3155],["Tornado in IA, 19",3011],["Tornado in IL, 17",2974],["Tornado in MS, 28",2731],["Tornado in MO, 29",2555],["Tornado in LA, 22",2400],["Unnamed Ghost Town",2277],["Unnamed Wreck",2184],["Tornado in MN, 27",2148],["Tornado in CO, 8",2071],["Tornado in AL, 1",1979],["Tornado in GA, 13",1929],["Tornado in SD, 46",1924],["Tornado in AR, 5",1715],["Unnamed Hot Spring",1689]],"top_words":[["in",4976],["tornado",4415],["sighting",3455],["-",3450],["ufo",3408],["unnamed",1404],["cave",1281],["de",870],["tx,",555],["48",555],["ca",479],["la",367],["of",340],["dolmen",313],["yamato",274],["20",266],["1",266],["ks,",263],["40",242],["ok,",241],["fl",231],["12",229],["del",225],["range",224],["31",221]],"vocab_skipped":null,"word_histogram":{"counts":[105780,56821,162248,21591,4501,599,1064,500,774,279,330,90,113,25,20,12,11,3,6,0,1,0,0,0,0,0,0,0,1,1],"edges":[1.0,2.5,4.0,5.5,7.0,8.5,10.0,11.5,13.0,14.5,16.0,17.5,19.0,20.5,22.0,23.5,25.0,26.5,28.0,29.5,31.0,32.5,34.0,35.5,37.0,38.5,40.0,41.5,43.0,44.5,46.0]}},"kind":"text","n":354770,"n_null":0,"n_unique":189861,"null_rate":0.0,"stats":{"allcaps_rate":0.012830848155142769,"boilerplate_rate":0.0,"duplicate_rate":0.46483355413366406,"emoji_rate":2.8187276263494657e-06,"len_max":235,"len_mean":19.99670208867717,"len_median":17.0,"len_min":1,"len_p95":32.0,"n_duplicates":164909,"n_empty":0,"one_word_rate":0.09410885926092961,"readability_flesch_mean":64.79353084415587,"url_rate":0.0,"vocab_size":15811,"word_mean":3.564382557713448,"word_median":4.0}},{"alerts":[{"code":"multilingual","level":"info","message":"22 
languages detected in sample"},{"code":"duplicates","level":"warn","message":"38.3% duplicate strings"}],"column":"description","extras":{"language_counts":{"__engine":"fasttext:4,999","als":1,"ba":13,"be":9,"ca":4,"cs":2,"de":28,"en":4893,"es":2,"eu":6,"fr":6,"it":4,"ja":1,"ko":1,"la":1,"no":6,"pl":2,"pt":6,"ru":9,"sl":2,"tt":1,"uk":2},"language_sample_size":5000,"length_histogram":{"counts":[71484,53646,49789,14135,30283,28147,8588,6163,5647,4082,9912,3581,678,439,426,525,479,430,412,576,1185,1361,1320,5787,878,1496,1410,1914,1940,1927,1960,2295,2190,2487,2493,3014,2997,3598,5468,19628],"edges":[1.0,13.475,25.95,38.425,50.9,63.375,75.85,88.325,100.8,113.27499999999999,125.75,138.225,150.7,163.17499999999998,175.65,188.125,200.6,213.075,225.54999999999998,238.025,250.5,262.97499999999997,275.45,287.925,300.4,312.875,325.34999999999997,337.825,350.3,362.775,375.25,387.72499999999997,400.2,412.675,425.15,437.625,450.09999999999997,462.575,475.05,487.525,500.0]},"near_unique":false,"sample":["Meteorite Kainsaz - CO3.2. Mass: Unknowng. Found: Fell.","Former isolated_dwelling; Former population: 2024","Type: Cursus County/Region: Perth and Kinross Alt Name: Blairgowrie Road  Pos Accuracy: 4 Condition: 3 (5 is best)   Ambience: 3  Access: 3  (5 is best)\n                    Lat: 56.548916969168 &nbsp;&nbsp;&nbsp;Long: -3.362524704168\n\n                    Cursus in Perth and Kinross. Once thought to have been a Roman defensive earthwork, excavation of the site revealed it to be a cursus monument and it has been dated to 3600 BC.Monument is about .... (c) Meg. Portal contributors.\n\t\t     Link To M","Type: Burial Chamber or Dolmen County/Region: Languedoc:Gard (30) Alt Name: Bordezac dolmen  Pos Accuracy: 5 Condition: 3 (5 is best)   Ambience: 4  Access: 4  (5 is best)\n                    Lat: 44.3113 &nbsp;&nbsp;&nbsp;Long: 4.06723\n\n                    Dolmen de Chams (or Bordezac dolmen) is covered by a 10 tons capstone. 
A part of the dolmen is in sandtone and the other part in schist. .   .... (c) Meg. Portal contributors.\n\t\t     Link To More Information","F0, 0.39mi long, 50yd wide","the site in question is the \"glowing tombstone\" , at a distance you can see one tombstone glow in the dark. The tombstone glows until you get to the edge of the cemetery, then it goes dark. You cant really pinpoint the actual tomb and there's no lights around to illuminate it either. Some say its ma","F0, 0.83mi long, 30yd wide","Type: Passage Grave County/Region: Ile-de-France:Seine-et-Marne 77  Pos Accuracy: 2  (5 is best)\n                    Lat: 48.41 &nbsp;&nbsp;&nbsp;Long: 3.229\n                    Hypogee in Ile-de-France:Seine-et-Marne 77. Mousseau-les-Bray 2 is a Hypogee in the community of Mousseau-les-Bray, Departement of Seine-et-Marne, Region of Ile-de-France.... (c) Meg. Portal contributors.\n\t\t     Link To More Information","Type: Burial Chamber or Dolmen County/Region: Catalu\u00f1a  Pos Accuracy: 5  (5 is best)\n                    Lat: 41.813443 &nbsp;&nbsp;&nbsp;Long: 2.1982\n\n                    Burial Chamber (Dolmen) in Catalu\u00f1a. .... (c) Meg. Portal contributors.\n\t\t     Link To More Information","Meteorite Grove Mountains 021502 - L6. Mass: Unknowng. Found: Found.","Access: no","15 injuries, 0 fatalities; $6.00M property damage","F0, 0.1mi long, 10yd wide","Meteorite Acfer 134 - L5. Mass: Unknowng. Found: Found.","F2, 2.0mi long, 10yd wide","Crafts flying over my house it seems like every night.","Meteorite Yamato 86125 - H4. Mass: Unknowng. Found: Found.","Type: Burial Chamber or Dolmen County/Region: Pais Vasco Alt Name: Munarriko Landa 1 Trikuharria  Pos Accuracy: 4  (5 is best)\n                    Lat: 43.36063 &nbsp;&nbsp;&nbsp;Long: -2.962342\n                    Burial Chamber (Dolmen) in Pais Vasco. .... (c) Meg. Portal contributors.\n\t\t     Link To More Information","Bellevue Hall - The ghost of Emily Galt is said to haunt the building. 
Emily etched her name (\"Emily Galt, 1816\") in the glass of one of the windows before her fianc\u00e9 left and was killed, in the Civil War. Finding out her betrothed was dead; she threw herself out of one of the upper windows, and die","F0, 0.1mi long, 30yd wide","F2, 2.0mi long, 50yd wide","Meteorite Grove Mountains 022485 - H4. Mass: Unknowng. Found: Found.","Large&#44 hovering&#44 triangular shaped object(s) in New Albany&#44 Indiana.","Man and his son witness object following high-altitude aircraft in the daytime sky.","Cave entrance","Former isolated_dwelling; Wikipedia: be:\u0412\u043e\u0440\u0430\u045e\u0448\u0447\u044b\u043d\u0430","Cave entrance","Large white light with a red hue low in the western sky.  Remained for 20 min or more then vanished. ((NUFORC Note:  Venus??  PD))","Meteorite Queen Alexandra Range 99691 - LL5. Mass: Unknowng. Found: Found.","Class B - Report 12510: Vocalizations near Scenic interrupt a camper\u2019s quiet evening","Cave entrance","Cave entrance","Access: no","F0, 0.3mi long, 20yd wide","F0, 0.1mi long, 20yd wide","F1, 3.16mi long, 50yd wide","Type: Standing Stone (Menhir) County/Region: Bohemia Condition: 4 (5 is best)   Ambience: 4  (5 is best)\n                    Lat: 50.21111 &nbsp;&nbsp;&nbsp;Long: 14.11722\n\n                    Standing Stone (Menhir) in the Czech Republic, Bohemia. 1 Meter tall menhir in fields..... (c) Meg. Portal contributors.\n\t\t     Link To More Information","Magnitude 0; 14 injuries, 0 fatalities; $25K property damage","F0, 4.8600mi long, 10yd wide","$2.60M property damage; A thunderstorm produced very heavy rain that caused flash flooding and damage to the Tlaquepaque area of Sedona.","Type: Barrow Cemetery County/Region: Wiltshire  Pos Accuracy: 5 Condition: 3 (5 is best)   Ambience: 4  Access: 3  (5 is best)\n                    Lat: 51.135539819745 &nbsp;&nbsp;&nbsp;Long: -1.810860540741\n\n                    Barrow Cemetery in Wiltshire. 
Little Down Barrow Group consists of three Bronze Age bowl barrows, two of which are still distinguishable on the ridge of a hill over Great Durnford. \n\nThe.... (c) Meg. Portal contributors.\n\t\t     Link To More Information","Type: Round Barrow(s) County/Region: Suffolk  Pos Accuracy: 5 Condition: 3 (5 is best)   Ambience: 4  Access: 4  (5 is best)\n                    Lat: 52.066920980391 &nbsp;&nbsp;&nbsp;Long: 1.2648018296687\n\n                    Although not as well preserved as its neighbour, it is still reasonably well preserved. Dug into on the W. side,\nit measures 20.0 m. N-S by 16.0 m. transversely and is 0.5 m. high.. The third B.... (c) Meg. Portal contributors.\n\t\t     Link To More Information","F1, 0.5mi long, 10yd wide","Type: Round Barrow(s) County/Region: Pomorskie Alt Name: Go&#322;czewo Round Barrow  Pos Accuracy: 4 Condition: 3 (5 is best)   (5 is best)\n                    Lat: 54.18925 &nbsp;&nbsp;&nbsp;Long: 17.64828\n\n                    Some 0.5km north of the Stropno lake there is a large round barrow. Its stone covering is heavily damaged. The age of the monument remains unknown, although it might be an early medieval burial mounds.... (c) Meg. Portal contributors.\n\t\t     Link To More Information","Type: Stone Circle County/Region: Isle of Mull Alt Name: Lochbuie  Pos Accuracy: 4 Condition: 4 (5 is best)   Ambience: 5  Access: 3  (5 is best)\n                    Lat: 56.358062351267 &nbsp;&nbsp;&nbsp;Long: -5.858088474955\n\n                    Stone Circle in Mull. This 13.4m diameter circle originally consisted of 9 stones, one of which has disappeared and been replaced with a small boulder. The stones range in height from 1.2m to 2m and h.... (c) Meg. Portal contributors.\n\t\t     Link To Mo","People have reported seeing ghostly figures that supposedly committed suicide in the millhouse down from the millpond. 
The sightings include a young man and young woman hanging together, and the original owner of the mill, who is also hanging in the millhouse.","F1, 0.3mi long, 20yd wide","F2, 25.0mi long, 500yd wide","aLL LIGHTS WENT OFF &#44 BUT&#44 ELECTRONIC EQUIPTMENT CAME ON &#44 EVEN THOUGHT THERE WAS NO POWER  ( THER WERE NO STORMS &#44 THUNDER&#44 LIGHTENING","Type: Long Barrow County/Region: Fyn,\u00a0Langeland and Islands Alt Name: Myrebjerg  Pos Accuracy: 5 Condition: 2 (5 is best)   Ambience: 3  Access: 3  (5 is best)\n                    Lat: 54.764357 &nbsp;&nbsp;&nbsp;Long: 10.678561\n\n                    Langdysse (Long Barrow) in Svendborg. When I first was looking at it from the road I was disappointed and didn't expect much. But, when I climbed up the mound I was taken by surprise - an open burial .... (c) Meg. Portal contributors.\n\t\t     Link To "],"top_values":[["Cave entrance",52067],["Former hamlet",6309],["F0, 0.1mi long, 10yd wide",5680],["Hot Spring",5003],["Shipwreck",3134],["F1, 0.1mi long, 10yd wide",2425],["Former isolated_dwelling",2337],["Access: yes",2062],["Access: no",1439],["Show cave (tourist attraction)",1279],["F0, 0.1mi long, 20yd wide",1091],["F0, 0.1mi long, 50yd wide",1059],["Magnitude 0; $2.5M property damage",1055],["F0, 0.2mi long, 10yd wide",858],["F0, 0.1mi long, 30yd wide",824],["F2, 0.1mi long, 10yd wide",728],["Former village",709],["$1.00M property damage",660],["F0, 0.5mi long, 50yd wide",650],["Access: 
private",555]],"top_words":[["the",8467],["is",7701],["in",6738],["(5",5576],["of",5472],["to",5412],["a",5213],["wide",4094],["long,",4074],["4",3629],["and",3592],["type:",3580],["lat:",3574],["&nbsp;&nbsp;&nbsp;long:",3574],["(c)",3507],["meg.",3475],["best)\n",3473],["portal",3461],["pos",3387],["accuracy:",3387],["more",3365],["county/region:",3306],["contributors.\n\t\t",3296],["link",3191],["information",3047]],"vocab_skipped":null,"word_histogram":{"counts":[168662,45929,41010,10628,10001,7103,3638,766,662,500,905,1583,2350,945,290,1345,2377,3063,3691,5622,3846,4422,3799,5908,7687,12348,4773,903,13,1],"edges":[1.0,5.466666666666667,9.933333333333334,14.4,18.866666666666667,23.333333333333336,27.8,32.266666666666666,36.733333333333334,41.2,45.66666666666667,50.13333333333333,54.6,59.06666666666667,63.53333333333333,68.0,72.46666666666667,76.93333333333334,81.4,85.86666666666667,90.33333333333334,94.8,99.26666666666667,103.73333333333333,108.2,112.66666666666667,117.13333333333334,121.60000000000001,126.06666666666666,130.53333333333333,135.0]}},"kind":"text","n":354770,"n_null":0,"n_unique":218717,"null_rate":0.0,"stats":{"allcaps_rate":0.0042562787157876935,"boilerplate_rate":0.0002508667587451025,"duplicate_rate":0.3834963497477239,"emoji_rate":0.0,"len_max":500,"len_mean":114.04985201679962,"len_median":40.0,"len_min":1,"len_p95":491.0,"n_duplicates":136053,"n_empty":0,"one_word_rate":0.01018406291400062,"readability_flesch_mean":66.65188545892048,"url_rate":0.008148941567776305,"vocab_size":38639,"word_mean":24.07085153761592,"word_median":7.0}},{"alerts":[],"column":"category","extras":{"singletons":0,"top_values":[["noaa_tornadoes",71813],["osm_caves",70242],["ufo_sightings",60632],["megalithic_portal",60028],["nasa_meteorites",32186],["osm_ghost_towns",18154],["noaa_storm_events",14770],["haunted_places",9717],["noaa_thermal_springs",5003],["bigfoot_sightings",3797],["usgs_earthquakes",3742],["noaa_shipwrecks",3653],["nasa_fireballs",863],["usgs_volcan
oes",170]]},"kind":"categorical","n":354770,"n_null":0,"n_unique":14,"null_rate":0.0,"stats":{"cardinality":14,"entropy":2.9854530614507264,"entropy_ratio":0.7841278584653993,"top_rate":0.20242128703103418,"top_value":"noaa_tornadoes"}},{"alerts":[{"code":"one_word","level":"warn","message":"99.5% rows are a single word"},{"code":"allcaps","level":"info","message":"91.3% rows are all-caps"},{"code":"null_rate","level":"warn","message":"41.9% null"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"88.6% duplicate strings"}],"column":"date","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[17854,0,1,0,0,151,13,0,1,21,5,0,3,183475,17,0,6,8,10,0,8,7,12,0,180,4425,1,0,1,0,0,0,0,0,0,0,0,0,0,1],"edges":[0.0,0.75,1.5,2.25,3.0,3.75,4.5,5.25,6.0,6.75,7.5,8.25,9.0,9.75,10.5,11.25,12.0,12.75,13.5,14.25,15.0,15.75,16.5,17.25,18.0,18.75,19.5,20.25,21.0,21.75,22.5,23.25,24.0,24.75,25.5,26.25,27.0,27.75,28.5,29.25,30.0]},"near_unique":false,"sample":["1932-01-01","2015-05-08","1971-02-21","","2010-07-28","","2005-06-19","2009-03-26","","2009-01-01","1990-12-21","1971-05-08","1977-07-25","1896-01-01","2013-07-03","2011-08-12","2002-01-01","","","2010-09-12","2010-07-25","2001-01-01","1997-04-05","2001-01-01","2005-06-17","2017-03-07","1976-04-19","1999-06-27","2006-01-01","","1998-05-31","1999-05-31","1999-05-29","2013-07-26","2013-09-14","2008-10-01","1979-06-09","1964-07-26","2014-01-08","1970-04-26","2024-09-26","2021-09-01","1999-10-10","2020-04-12","","","1999-12-22","2010-05-14","1986-01-01","1997-03-01"],"top_values":[["",17854],["1979-01-01",3049],["1988-01-01",2298],["2003-01-01",1732],["1999-01-01",1603],["2000-01-01",1520],["1997-01-01",1514],["1990-01-01",1507],["1986-01-01",1388],["2001-01-01",1300],["2006-01-01",1244],["2002-01-01",1036],["1993-01-01",979],["1987-01-01",921],["1991-01-01",874],["1994-01-01",724],["1974-01-01",698],["1996-01-01",59
0],["1998-01-01",493],["1995-01-01",493]],"top_words":[["1979-01-01",306],["1988-01-01",247],["2003-01-01",182],["2000-01-01",160],["1990-01-01",159],["1999-01-01",156],["1997-01-01",149],["1986-01-01",132],["2001-01-01",122],["2006-01-01",115],["2002-01-01",112],["1991-01-01",98],["1987-01-01",86],["1993-01-01",75],["1994-01-01",67],["1974-01-01",65],["1985-01-01",63],["1996-01-01",53],["2010-01-01",52],["1995-01-01",50],["1998-01-01",48],["1977-01-01",42],["1983-01-01",40],["1984-01-01",38],["2011-04-27",37]],"vocab_skipped":null,"word_histogram":{"counts":[205261,0,0,0,0,0,0,880,0,0,0,0,0,0,0,56,0,0,0,0,0,0,2,0,0,0,0,0,0,1],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":354770,"n_null":148570,"n_unique":23500,"null_rate":0.41877836344674013,"stats":{"allcaps_rate":0.9129776915615907,"boilerplate_rate":0.0,"duplicate_rate":0.8860329776915616,"emoji_rate":0.0,"len_max":30,"len_mean":9.330581959262851,"len_median":10.0,"len_min":0,"len_p95":10.0,"n_duplicates":182700,"n_empty":17854,"one_word_rate":0.9954461687681863,"readability_flesch_mean":112.11327500000003,"url_rate":0.0,"vocab_size":8565,"word_mean":1.0048593598448108,"word_median":1.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"55.3% 
null"}],"column":"country","extras":{"singletons":13,"top_values":[["USA",86583],["US",60634],["",9497],["RU",1481],["BY",205],["KZ",156],["HT",13],["KY",9],["AU",6],["DE",5],["GB",5],["IQ",3],["RO",2],["EC",2],["IT",2],["TW",1],["MX",1],["CW",1],["BS",1],["MT",1]]},"kind":"categorical","n":354770,"n_null":196154,"n_unique":28,"null_rate":0.5529046988189531,"stats":{"cardinality":28,"entropy":1.341214878338975,"entropy_ratio":0.2789922733154305,"top_rate":0.5458654864578605,"top_value":"USA"}},{"alerts":[{"code":"one_word","level":"warn","message":"72.9% rows are a single word"},{"code":"null_rate","level":"warn","message":"82.9% null"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"84.9% duplicate strings"}],"column":"city","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[74,0,1497,0,3313,0,7780,0,9464,0,7830,0,8339,0,7192,0,5509,0,3694,0,2353,0,1537,0,800,0,787,0,203,0,155,0,44,0,25,0,13,0,21,2],"edges":[3.0,3.5,4.0,4.5,5.0,5.5,6.0,6.5,7.0,7.5,8.0,8.5,9.0,9.5,10.0,10.5,11.0,11.5,12.0,12.5,13.0,13.5,14.0,14.5,15.0,15.5,16.0,16.5,17.0,17.5,18.0,18.5,19.0,19.5,20.0,20.5,21.0,21.5,22.0,22.5,23.0]},"near_unique":false,"sample":["anchorage","duncannon","pflugerville","whitesburg","baton rouge","boscobel","hanover","manassas","amarillo","litchfield park","newark","pineville","palm bay","nikiski","tampa","south san francisco","encino","corpus christi","genoa","garden city","decatur","mesa","san diego","fresno","mason","latrobe","advance","thousand oaks","biggs","appleton","kingsbury","new york city","new york city","indianapolis","lake in the hills","boston","manson","grand marais","paxton","kansas city","jonesborough","ephrata","orlando","edmonds","seattle","green bay","arlington heights","indianapolis","sacramento","mapleton"],"top_values":[["seattle",468],["phoenix",435],["las vegas",356],["portland",353],["los angeles",343],["san 
diego",325],["houston",290],["chicago",255],["tucson",237],["miami",229],["orlando",212],["austin",210],["springfield",206],["albuquerque",202],["columbus",197],["sacramento",194],["san jose",187],["denver",184],["san francisco",179],["san antonio",173]],"top_words":[["city",531],["beach",441],["san",412],["lake",295],["park",214],["springs",201],["new",184],["seattle",172],["st.",162],["santa",152],["north",151],["valley",146],["phoenix",139],["west",135],["los",127],["las",125],["fort",118],["angeles",115],["falls",112],["vegas",110],["diego",102],["portland",100],["miami",96],["chicago",86],["houston",86]],"vocab_skipped":null,"word_histogram":{"counts":[44226,0,0,0,0,0,0,15357,0,0,0,0,0,0,0,1029,0,0,0,0,0,0,19,0,0,0,0,0,0,1],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":354770,"n_null":294138,"n_unique":9149,"null_rate":0.8290949065591792,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.8491060825966487,"emoji_rate":0.0,"len_max":23,"len_mean":8.828638342789286,"len_median":9.0,"len_min":3,"len_p95":14.0,"n_duplicates":51483,"n_empty":0,"one_word_rate":0.7294168096054888,"readability_flesch_mean":21.736675000000034,"url_rate":0.0,"vocab_size":4862,"word_mean":1.288230637287241,"word_median":1.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"58.5% 
null"}],"column":"state","extras":{"singletons":4,"top_values":[["TX",12727],["CA",8791],["FL",7372],["IL",5329],["KS",5127],["OK",5056],["MO",3905],["CO",3766],["WA",3648],["IA",3647],["OH",3521],["NE",3506],["AL",3196],["PA",3193],["NC",3186],["GA",3112],["MN",3110],["MS",3086],["NY",2951],["LA",2927]]},"kind":"categorical","n":354770,"n_null":207555,"n_unique":118,"null_rate":0.5850410124869634,"stats":{"cardinality":118,"entropy":5.668267392480794,"entropy_ratio":0.8235596923781127,"top_rate":0.08645178820093061,"top_value":"TX"}},{"alerts":[{"code":"null_rate","level":"warn","message":"82.9% null"}],"column":"shape","extras":{"singletons":5,"top_values":[["light",12895],["triangle",6268],["circle",5890],["fireball",4939],["unknown",4359],["other",4209],["sphere",4134],["disk",3853],["oval",2881],["formation",1908],["cigar",1569],["changing",1517],["flash",1025],["rectangle",1010],["cylinder",977],["diamond",884],["chevron",774],["teardrop",560],["egg",555],["cone",235]]},"kind":"categorical","n":354770,"n_null":294138,"n_unique":28,"null_rate":0.8290949065591792,"stats":{"cardinality":28,"entropy":3.7736568730593287,"entropy_ratio":0.784975716218631,"top_rate":0.2126764744689273,"top_value":"light"}},{"alerts":[{"code":"null_rate","level":"warn","message":"82.9% null"},{"code":"high_skew","level":"info","message":"skew=+135.86"},{"code":"outliers","level":"warn","message":"12.8% rows beyond 1.5 
IQR"}],"column":"duration_seconds","extras":{"histogram":{"counts":[60612,11,0,3,1,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,1],"edges":[0.01,1656900.00975,3313800.0094999997,4970700.00925,6627600.009,8284500.008749999,9941400.0085,11598300.00825,13255200.008,14912100.007749999,16569000.007499998,18225900.00725,19882800.007000003,21539700.006750003,23196600.006500002,24853500.00625,26510400.006,28167300.00575,29824200.0055,31481100.00525,33138000.005,34794900.00475,36451800.004499994,38108700.00425,39765600.004,41422500.00375,43079400.0035,44736300.003249995,46393200.003,48050100.002749994,49707000.0025,51363900.00224999,53020800.002,54677700.00175,56334600.001499996,57991500.00125,59648400.000999995,61305300.00075,62962200.00049999,64619100.00025,66276000.0]},"sample":[1800.0,240.0,45.0,480.0,10.0,60.0,1800.0,120.0,180.0,1.0,600.0,180.0,5.0,3600.0,600.0,60.0,12.0,20.0,60.0,120.0,180.0,120.0,900.0,900.0,120.0,240.0,10.0,660.0,1200.0,240.0,240.0,900.0,105.0,120.0,10.0,360.0,7.0,45.0,1800.0,600.0,600.0,1800.0,2700.0,4.0,300.0,1.0,15.0,20.0,15.0,10.0,600.0,1800.0,15.0,15.0,1800.0,120.0,300.0,60.0,8.0,300.0,900.0,900.0,300.0,60.0,15.0,18000.0,3.0,600.0,300.0,720.0,1800.0,60.0,10800.0,300.0,1200.0,300.0,10.0,15.0,10.0,600.0,180.0,240.0,300.0,60.0,3600.0,45.0,9000.0,240.0,120.0,120.0,120.0,600.0,2.0,7.0,30.0,1200.0,240.0,5.0,120.0,600.0,600.0,20.0,3600.0,1320.0,5.0,120.0,300.0,14400.0,15.0,60.0,300.0,420.0,900.0,600.0,180.0,600.0,300.0,180.0,180.0,10800.0,360.0,1800.0,300.0,7200.0,900.0,60.0,3.0,120.0,600.0,3.0,120.0,120.0,1.0,120.0,30.0,300.0,90.0,360.0,90.0,300.0,30.0,180.0,300.0,120.0,300.0,30.0,600.0,10.0,10800.0,300.0,1200.0,10.0,60.0,300.0,20.0,30.0,600.0,15.0,60.0,600.0,240.0,600.0,1800.0,780.0,240.0,600.0,240.0,20.0,240.0,45.0,600.0,1200.0,18000.0,1800.0,2.0,45.0,300.0,60.0,20.0,15.0,20.0,600.0,10.0,1200.0,600.0,300.0,1800.0,1200.0,2700.0,1200.0,180.0,900.0,120.0,3600.0,2.0,300.0,1200.0,240.0,60.0,1200.0,180.0,5.0,30.0,180.0,3600.0,15.0,2
5.0,60.0,7200.0,240.0,480.0,74.0,120.0,7200.0,10.0,300.0,20.0,1800.0,3600.0,2.0,480.0,30.0,600.0,3600.0,180.0,172800.0,60.0,7.0,600.0,7200.0,2700.0,20.0,120.0,300.0,180.0,30.0,4.0,900.0,120.0,1200.0,3600.0,900.0,3600.0,30.0,600.0,15.0,1800.0,600.0,120.0,30.0,180.0,180.0,3.0,600.0,74.0,600.0,30.0,7200.0,6.0,10.0,600.0,1.0,20.0,60.0,600.0,5.0,300.0,600.0,2.0,1800.0,5.0,300.0,2.0,240.0,60.0,300.0,30.0,30.0,600.0,240.0,20.0,600.0,45.0,6.0,10.0,30.0,180.0,45.0,60.0,120.0,30.0,3600.0,300.0,10.0,180.0,8.0,1200.0,30.0,240.0,1200.0,120.0,2.0,30.0,3600.0,2.0,300.0,60.0,3600.0,15300.0,0.5,600.0,240.0,600.0,600.0,120.0,300.0,1800.0,300.0,300.0,120.0,240.0,1200.0,2700.0,4.0,300.0,3.0,2400.0,120.0,10.0,2.0,45.0,30.0,900.0,180.0,1200.0,900.0,45.0,120.0,600.0,420.0,600.0,600.0,600.0,300.0,1800.0,900.0,300.0,60.0,40.0,1800.0,15.0,600.0,180.0,5.0,360.0,300.0,1800.0,600.0,300.0,3.0,14400.0,600.0,420.0,3.0,300.0,30.0,5.0,1200.0,120.0,20.0,1500.0,300.0,300.0,300.0,300.0,60.0,120.0,600.0,420.0,30.0,600.0,10.0,120.0,600.0,45.0,1200.0,180.0,600.0,30.0,300.0,120.0,60.0,60.0,10.0,10.0,420.0,240.0,30.0,1800.0,120.0,3.0,300.0,600.0,10.0,15.0,60.0,300.0,30.0,300.0,60.0,900.0,30.0,1200.0,480.0,3600.0,600.0,300.0,10.0,300.0,180.0,5.0,60.0,5.0,60.0,7.0,5400.0,900.0,600.0,15.0,10.0,120.0,20.0,900.0,600.0,1200.0,60.0,600.0,120.0,300.0,300.0,10.0,60.0,900.0,120.0,600.0,5.0,5.0,4.0,10.0,1800.0,2.0,300.0,180.0,180.0,420.0,900.0,300.0,1800.0,60.0,300.0,300.0,30.0,600.0,600.0,60.0,3600.0,300.0,120.0,4.0,5.0,30.0,600.0,60.0,1.0,1.0,2100.0,20.0,15.0,35.0,4.0,5.0,180.0,120.0,900.0,6.0,900.0,7.0,60.0,300.0,240.0,1.5,5.0,20.0,120.0,900.0,300.0,120.0,180.0,60.0,3.0]},"kind":"numeric","n":354770,"n_null":294138,"n_unique":444,"null_rate":0.8290949065591792,"stats":{"iqr":570.0,"kurtosis":19379.843400645914,"max":66276000.0,"mean":5410.127843053173,"median":180.0,"min":0.01,"n_outliers":7753,"outlier_rate":0.12786977173769626,"q1":30.0,"q3":600.0,"skew":135.86110260966558,"std":414386.6738089271,"zero_rate":0.0}
},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"mass_g","extras":{},"kind":"unknown","n":354770,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.9% null"}],"column":"meteorite_class","extras":{"singletons":135,"top_values":[["L6",6544],["H5",5614],["H4",3336],["H6",3234],["L5",2750],["LL5",1899],["LL6",963],["L4",831],["H4/5",380],["CM2",281],["Iron, IIIAB",272],["H3",244],["LL",220],["E3",205],["L3",176],["LL4",160],["H5/6",156],["Ureilite",155],["Howardite",127],["Diogenite",125]]},"kind":"categorical","n":354770,"n_null":322584,"n_unique":395,"null_rate":0.9092764326183161,"stats":{"cardinality":395,"entropy":4.370365043700154,"entropy_ratio":0.5066673502681652,"top_rate":0.2033182128875909,"top_value":"L6"}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.9% null"},{"code":"imbalance","level":"warn","message":"top value is 96.6% of rows"}],"column":"fall_type","extras":{"singletons":0,"top_values":[["Found",31090],["Fell",1096]]},"kind":"categorical","n":354770,"n_null":322584,"n_unique":2,"null_rate":0.9092764326183161,"stats":{"cardinality":2,"entropy":0.21432243547799887,"entropy_ratio":0.21432243547799887,"top_rate":0.9659479276704157,"top_value":"Found"}},{"alerts":[{"code":"null_rate","level":"warn","message":"76.7% null"}],"column":"magnitude","extras":{"singletons":79,"top_values":[["0",36675],["1",24542],["2",9904],["3",2630],["-9",1278],["4.5",686],["4",591],["4.6",558],["4.7",415],["1.75",383],["4.8",317],["5",297],["4.9",261],["2.75",220],["5.1",202],["5.2",167],["70.00",162],["50.00",151],["2.00",150],["5.3",126]]},"kind":"categorical","n":354770,"n_null":272093,"n_unique":294,"null_rate":0.7669560560363052,"stats":{"cardinality":294,"entropy":2.513568827762577,"entropy_ratio":0.30654503278359213,"top_rate":0.4435937443303458,"top_value":"0"}},{"alerts":[{"code":"null_rate","level":"warn","message":"98.9% 
null"},{"code":"high_skew","level":"info","message":"skew=+3.07"},{"code":"outliers","level":"warn","message":"8.4% rows beyond 1.5 IQR"}],"column":"depth_km","extras":{"histogram":{"counts":[219,1730,370,258,230,250,167,129,56,31,43,27,19,29,21,19,24,12,9,14,13,19,14,5,6,0,7,4,0,1,5,1,3,2,3,1,0,0,0,1],"edges":[-2.261,4.013025,10.28705,16.561075,22.8351,29.109125000000002,35.38314999999999,41.657174999999995,47.9312,54.205225,60.47925,66.753275,73.0273,79.301325,85.57535,91.84937500000001,98.1234,104.397425,110.67145000000001,116.945475,123.21950000000001,129.493525,135.76755,142.041575,148.3156,154.589625,160.86365,167.137675,173.4117,179.685725,185.95975,192.233775,198.5078,204.781825,211.05585,217.32987500000002,223.6039,229.877925,236.15195,242.425975,248.7]},"sample":[3.11744499206543,66.444,10.0,10.0,11.6,12.0,8.1,40.785,40.0,35.0,35.0,2.92,5.2,44.3,10.0,74.4,10.0,10.0,35.0,12.51,55.566,41.164,10.0,10.0,10.0,2.624,10.0,8.368,46.3,32.334,10.0,10.0,10.0,53.325,3.51,4.7,26.4,54.392,13.929,45.624,3.7,42.312,35.0,28.04,17.032,10.0,10.0,112.6,129.185,20.0,10.0,36.7,10.0,39.895,42.9,10.0,11.919,10.0,13.08,41.4,43.139,11.623,10.0,10.0,10.0,6.799975586,61.6,35.0,35.0,35.0,10.0,20.49,19.0,20.0,2.2,10.0,151.2,16.51,10.0,47.17,10.0,10.0,10.0,10.0,10.0,10.0,14.05,10.0,33.0,6.8,10.0,36.3,10.0,19.3,24.9,35.0,3.71,80.1,49.7,10.0,48.11,40.3,35.51,30.6,18.66,10.0,35.0,52.9,14.3,33.9,35.15,28.0,8.3,5.0,2.7,10.16,8.94,10.45,9.07,9.98,100.7,10.27,10.0,10.0,10.0,88.2,6.3,1.56,28.82,3.14,6.82,9.1,8.0,2.81,10.5,13.9,7.9,6.3,8.34,10.0,169.01,8.5,13.8,166.01,10.0,121.5,10.0,41.8,43.3,10.0,10.0,10.0,10.0,39.6,24.0,16.9,11.7,10.0,7.0,17.3,12.2,10.0,10.0,6.0,10.0,10.0,14.07,10.0,26.8,10.0,17.42,14.06,24.47,10.0,10.0,9.83,69.69,98.3,10.0,17.0,45.6,8.9,41.85,10.0,28.78,10.0,131.7,12.3,25.6,9.1,199.53,12.31,6.3,10.0,17.49,10.0,10.0,73.3,56.0,10.0,1.0,19.22,9.33,10.0,10.0,21.38,10.0,4.5,22.2,5.0,119.3,39.13,11.7,39.86,35.0,36.32,6.0,70.7,28.2,10.7,30.19,17.0,8.45,10.0,20.1,8.4,65.3,10.0,27.4,
5.23,10.0,16.6,9.03,11.12,12.2,1.8,10.0,10.0,10.0,2.08,5.0,9.3,11.952,9.45,9.92,9.85,14.84,21.5,10.0,15.1,13.0,11.4,10.0,139.2,10.0,10.0,10.0,10.0,8.7,10.0,13.0,10.0,84.7,8.4,10.0,10.0,10.0,15.0,10.0,4.17,3.3,10.0,24.632,61.7,10.0,10.0,8.0,10.0,9.963,10.0,16.1,10.0,136.3,10.0,10.0,55.2,10.0,10.0,10.1,10.0,10.0,12.6,10.0,36.7,5.0,29.0,136.2,10.0,36.0,46.2,31.9,18.0,248.7,13.146,10.0,153.1,10.0,10.0,9.939,10.0,10.0,4.8,6.8,3.1,6.7,4.8,10.9,10.0,50.7,38.5,8.073,10.0,4.6,3.278,10.0,16.603,4.085,35.0,31.6,89.2,4.9,10.0,10.0,39.8,10.0,10.0,10.0,11.5,9.987,10.0,10.0,10.0,19.0,33.0,13.7,20.4,51.6,25.7,6.006,24.4,10.0,14.987,10.0,10.0,10.0,10.0,31.1,10.0,25.9,10.0,10.0,10.0,10.0,3.535,2.8,14.25,10.0,31.2,10.0,10.0,27.6,10.0,10.0,6.001,26.1,10.0,8.8,26.9,13.2,37.0,10.0,10.0,5.9,10.0,45.5,10.0,47.3,25.8,10.0,10.0,10.0,4.725,56.6,10.0,0.2,10.0,10.0,10.0,10.0,38.5,20.064,10.0,10.0,26.7,33.3,19.4,1.8,14.0,44.1,93.1,40.3,10.0,10.0,10.0,19.8,10.0,10.0,10.0,10.0,37.1,10.0,37.6,54.7,27.274,10.0,32.1,166.7,37.7,30.1,61.7,36.2,122.9,5.5,10.0,17.4,16.3,10.0,5.589,75.2,10.0,7.347,33.0,5.0,1.0,1.0,3.6,0.7,6.6,5.6,0.8,0.9,2.7,1.0,4.2,3.67,45.8,63.2,33.0,0.0,17.195,18.0,33.0,33.0,6.791,4.83,7.007,33.0,40.5,13.678,10.0,33.0,10.0,10.0,10.0,-0.706,10.0,10.0,133.8,43.9,10.0,36.4,22.2,8.6,2.243,10.0,33.3,32.9,23.4,9.367,58.1,37.8,33.0,10.0,33.0,23.0,35.6,3.62,10.0,18.1,23.9]},"kind":"numeric","n":354770,"n_null":351028,"n_unique":1505,"null_rate":0.9894523212222003,"stats":{"iqr":19.1015,"kurtosis":11.610703248129315,"max":248.7,"mean":23.7120293534754,"median":10.0,"min":-2.261,"n_outliers":314,"outlier_rate":0.08391234633885623,"q1":10.0,"q3":29.1015,"skew":3.071857409692146,"std":28.78969272671201,"zero_rate":0.002672367717797969}},{"alerts":[{"code":"null_rate","level":"warn","message":"98.9% 
null"}],"column":"place","extras":{"language_counts":{"__engine":"fasttext:54","en":54},"language_sample_size":5000,"length_histogram":{"counts":[1,0,1,0,0,0,2,11,40,1,20,19,8,219,60,122,543,499,823,325,362,378,105,40,37,25,34,3,0,15,22,14,3,1,2,5,0,0,0,2],"edges":[4.0,5.375,6.75,8.125,9.5,10.875,12.25,13.625,15.0,16.375,17.75,19.125,20.5,21.875,23.25,24.625,26.0,27.375,28.75,30.125,31.5,32.875,34.25,35.625,37.0,38.375,39.75,41.125,42.5,43.875,45.25,46.625,48.0,49.375,50.75,52.125,53.5,54.875,56.25,57.625,59.0]},"near_unique":false,"sample":["88 km N of Yakutat, Alaska","100 km SW of Topolobampo, Mexico","Gulf of Alaska","8 km NNW of Tahoe Vista, California","88 km SSW of Nikolski, Alaska","33 km NE of Chignik, Alaska","204 km W of Port McNeill, Canada","69 km S of Nikolski, Alaska","181 km W of Ferndale, California","47 km NW of Ninilchik, Alaska","110 km SSW of El Huitusi, Mexico","274 km SSW of Prince Rupert, Canada","68 km S of Shungnak, Alaska","132 km SE of Akutan, Alaska","70 km ENE of Loreto, Mexico","73 km N of Chickaloon, Alaska","108km W of Petrolia, CA","111 km SSE of Akhiok, Alaska","51 km SSW of San Carlos, Mexico","18 km SE of Waynoka, Oklahoma","210 km SW of Port McNeill, Canada","66 km ENE of Chase, Alaska","off the coast of Oregon","44 km ESE of Peace River, Canada","52 km WNW of Nanwalek, Alaska","210 km W of Port McNeill, Canada","83 km ENE of San Luis, Mexico","290 km W of Bandon, Oregon","50 km SSW of Covenant Life, Alaska","72 km SE of Akhiok, Alaska","51 km SSE of Akutan, Alaska","134 km ESE of Nikolski, Alaska","71 km NNE of Santa Rosal\u00eda, Mexico","245 km W of Bandon, Oregon","49 km SW of False Pass, Alaska","64 km S of Arctic Village, Alaska","off the east coast of the United States","67 km SSW of Port Alexander, Alaska","227 km WNW of Port McNeill, Canada","256 km SSW of Prince Rupert, Canada","21 km N of Leadore, Idaho","208 km SSE of King Cove, Alaska","66 km S of Shungnak, Alaska","155 km S of False Pass, Alaska","110 km ESE of 
Akutan, Alaska","72 km NNE of Villa Alberto Andr\u00e9s Alvarado Ar\u00e1mburo, Mexico","197 km W of Port McNeill, Canada","64 km SE of Denali National Park, Alaska","94 km W of La Libertad, Mexico","83 km ESE of McKinley Park, Alaska"],"top_values":[["off the coast of Oregon",151],["south of Alaska",13],["Fox Islands, Aleutian Islands, Alaska",12],["Alaska Peninsula",10],["Southern Alaska",10],["104 km SSW of Nikolski, Alaska",7],["Unimak Island region, Alaska",7],["Vancouver Island, Canada region",7],["Haida Gwaii Region, Canada",7],["North Atlantic Ocean",7],["155 km S of False Pass, Alaska",7],["85 km SSE of Nikolski, Alaska",6],["92 km SSW of Nikolski, Alaska",5],["141 km S of False Pass, Alaska",5],["154 km S of False Pass, Alaska",5],["Gulf of Alaska",5],["Kodiak Island region, Alaska",5],["North Pacific Ocean",5],["82 km SSW of Nikolski, Alaska",5],["236 km W of Port McNeill, Canada",5]],"top_words":[["of",3618],["km",3220],["alaska",1991],["canada",472],["mexico",412],["se",397],["w",381],["ssw",379],["sse",373],["nikolski,",372],["oregon",283],["s",281],["sw",274],["port",262],["wsw",261],["mcneill,",216],["ese",202],["point,",182],["sand",173],["ca",172],["e",167],["wnw",166],["the",165],["off",159],["coast",159]],"vocab_skipped":null,"word_histogram":{"counts":[2,0,0,34,0,0,53,0,0,42,0,0,262,0,0,1821,0,0,1388,0,0,73,0,0,59,0,0,2,0,6],"edges":[1.0,1.3333333333333333,1.6666666666666665,2.0,2.333333333333333,2.6666666666666665,3.0,3.333333333333333,3.6666666666666665,4.0,4.333333333333333,4.666666666666666,5.0,5.333333333333333,5.666666666666666,6.0,6.333333333333333,6.666666666666666,7.0,7.333333333333333,7.666666666666666,8.0,8.333333333333332,8.666666666666666,9.0,9.333333333333332,9.666666666666666,10.0,10.333333333333332,10.666666666666666,11.0]}},"kind":"text","n":354770,"n_null":351028,"n_unique":3002,"null_rate":0.9894523212222003,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.19775521111704972,"emoji_rate":0.0,"len_max":59,"l
en_mean":29.465793693212184,"len_median":29.0,"len_min":4,"len_p95":36.0,"n_duplicates":740,"n_empty":0,"one_word_rate":0.0005344735435595938,"readability_flesch_mean":69.914087987013,"url_rate":0.0,"vocab_size":1036,"word_mean":6.293425975414217,"word_median":6.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"98.9% null"},{"code":"imbalance","level":"warn","message":"top value is 99.9% of rows"}],"column":"earthquake_type","extras":{"singletons":1,"top_values":[["earthquake",3739],["explosion",2],["landslide",1]]},"kind":"categorical","n":354770,"n_null":351028,"n_unique":3,"null_rate":0.9894523212222003,"stats":{"cardinality":3,"entropy":0.010137662013180244,"entropy_ratio":0.006396152595766536,"top_rate":0.9991982896846606,"top_value":"earthquake"}},{"alerts":[{"code":"null_rate","level":"warn","message":"100.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"volcano_type","extras":{"singletons":0,"top_values":[["Unknown",170]]},"kind":"categorical","n":354770,"n_null":354600,"n_unique":1,"null_rate":0.9995208163035206,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Unknown"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"elevation_m","extras":{},"kind":"unknown","n":354770,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"100.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"status","extras":{"singletons":0,"top_values":[["Unknown",170]]},"kind":"categorical","n":354770,"n_null":354600,"n_unique":1,"null_rate":0.9995208163035206,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Unknown"}},{"alerts":[{"code":"null_rate","level":"warn","message":"100.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"last_eruption","extras":{"singletons":0,"top_values":[["Unknown",170]]},"kind":"categorical","n":354770,"n_null":354600,"n_unique":1,"null_rate":0.9995208163035206,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Unknown"}},{"alerts":[{"code":"null_rate","level":"warn","message":"75.6% null"}],"column":"injuries","extras":{"singletons":70,"top_values":[["0",73943],["1",3402],["2",1957],["3",1118],["4",727],["5",625],["6",500],["10",362],["7",332],["8",292],["12",280],["9",202],["20",185],["15",181],["11",170],["13",136],["14",124],["30",116],["25",100],["16",91]]},"kind":"categorical","n":354770,"n_null":268187,"n_unique":233,"null_rate":0.7559461059277842,"stats":{"cardinality":233,"entropy":1.2336561456806954,"entropy_ratio":0.15687016087726754,"top_rate":0.8540129124654955,"top_value":"0"}},{"alerts":[{"code":"null_rate","level":"warn","message":"75.6% null"}],"column":"fatalities","extras":{"singletons":13,"top_values":[["0",80397],["1",4053],["2",932],["3",357],["4",190],["5",121],["6",112],["7",71],["9",40],["10",39],["8",34],["11",34],["16",22],["13",19],["12",15],["17",13],["14",11],["21",9],["18",8],["20",8]]},"kind":"categorical","n":354770,"n_null":268187,"n_unique":57,"null_rate":0.7559461059277842,"stats":{"cardinality":57,"entropy":0.5134309123372227,"entropy_ratio":0.08802341739521811,"top_rate":0.9285541041543952,"top_value":"0"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"allcaps","level":"info","message":"100.0% rows are all-caps"},{"code":"null_rate","level":"warn","message":"79.8% null"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"94.7% duplicate 
strings"}],"column":"length_miles","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[47630,0,0,0,0,0,0,0,11687,0,0,0,0,0,0,0,795,0,0,0,0,0,0,0,10712,0,0,0,0,0,0,0,986,0,0,0,0,0,0,3],"edges":[3.0,3.125,3.25,3.375,3.5,3.625,3.75,3.875,4.0,4.125,4.25,4.375,4.5,4.625,4.75,4.875,5.0,5.125,5.25,5.375,5.5,5.625,5.75,5.875,6.0,6.125,6.25,6.375,6.5,6.625,6.75,6.875,7.0,7.125,7.25,7.375,7.5,7.625,7.75,7.875,8.0]},"near_unique":false,"sample":["0.7","1.7","0.0200","12.3","0.2","7.6000","0.1","0.6200","1.4","0.1","0.1","0.1","24.5","0.1","0.1","1.0","0.1","6.5900","6.0600","1.5","0.1","21.4","0.1","0.1","3.0","1.54","30.0","3.6","0.1","2.4000","0.2","0.3","0.7","0.5","0.2","0.3","3.6000","3.0","0.1","0.4","3.96","11.0200","0.2","0.3600","1.8000","0.9900","12.0","7.0","0.3","2.6200"],"top_values":[["0.1",15456],["0.5",4842],["1.0",4603],["0.2",4447],["2.0",2724],["0.3",2410],["3.0",1145],["1.5",1087],["5.0",738],["4.0",682],["0.8",572],["2.5",509],["6.0",457],["0.0100",412],["0.4",405],["8.0",399],["7.0",375],["10.0",363],["0.7",349],["0.1000",282]],"top_words":[["0.1",4255],["0.5",1335],["1.0",1304],["0.2",1230],["2.0",759],["0.3",650],["1.5",315],["3.0",312],["5.0",203],["4.0",182],["0.8",152],["2.5",139],["0.0100",129],["6.0",128],["8.0",120],["7.0",111],["0.7",99],["0.4",99],["0.1000",96],["10.0",94],["12.0",69],["0.6",68],["9.0",67],["3.5",66],["2.3",66]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,71813,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":354770,"n_null":282957,
"n_unique":3795,"null_rate":0.7975787129689658,"stats":{"allcaps_rate":1.0,"boilerplate_rate":0.0,"duplicate_rate":0.9471544149387994,"emoji_rate":0.0,"len_max":8,"len_mean":3.6875078328436355,"len_median":3.0,"len_min":3,"len_p95":6.0,"n_duplicates":68018,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":121.22000000000004,"url_rate":0.0,"vocab_size":2268,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"79.8% null"}],"column":"width_yards","extras":{"singletons":176,"top_values":[["10",14492],["50",10603],["100",7243],["30",4882],["20",4431],["200",3046],["25",2530],["150",2234],["75",2026],["40",2006],["300",1518],["33",1161],["17",1037],["400",977],["250",828],["23",812],["60",765],["440",682],["500",665],["80",605]]},"kind":"categorical","n":354770,"n_null":282957,"n_unique":437,"null_rate":0.7975787129689658,"stats":{"cardinality":437,"entropy":4.4931808880768545,"entropy_ratio":0.5122483363515538,"top_rate":0.2018019021625611,"top_value":"10"}},{"alerts":[{"code":"null_rate","level":"warn","message":"98.6% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"type","extras":{"singletons":0,"top_values":[["hot_spring",5003]]},"kind":"categorical","n":354770,"n_null":349767,"n_unique":1,"null_rate":0.9858979056853736,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"hot_spring"}},{"alerts":[{"code":"long_tail","level":"info","message":"34 singleton categories"},{"code":"null_rate","level":"warn","message":"98.6% null"},{"code":"imbalance","level":"warn","message":"top value is 97.4% of rows"}],"column":"temperature","extras":{"singletons":34,"top_values":[["",4874],["hot",73],["90",4],["100",4],["21",3],["95",3],["37",2],["43",2],["28",2],["40",2],["37-39\u00b0",1],["35-37 
\u00b0C",1],["58\u00b0C",1],["52,1",1],["25-30",1],["98\u00b0C",1],["40-43\u00b0",1],["77",1],["25\u00b0C",1],["52",1]]},"kind":"categorical","n":354770,"n_null":349767,"n_unique":44,"null_rate":0.9858979056853736,"stats":{"cardinality":44,"entropy":0.256555462573728,"entropy_ratio":0.04699307189743052,"top_rate":0.9742154707175694,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"51.6% null"}],"column":"source","extras":{"singletons":0,"top_values":[["OpenStreetMap contributors",88396],["The Megalithic Portal",60028],["NOAA Storm Events Database",14770],["OpenStreetMap",8656]]},"kind":"categorical","n":354770,"n_null":182920,"n_unique":4,"null_rate":0.5156016574118443,"stats":{"cardinality":4,"entropy":1.5448347031842733,"entropy_ratio":0.7724173515921366,"top_rate":0.5143788187372709,"top_value":"OpenStreetMap contributors"}},{"alerts":[{"code":"long_tail","level":"info","message":"14 singleton categories"},{"code":"null_rate","level":"warn","message":"99.0% null"}],"column":"vessel_type","extras":{"singletons":14,"top_values":[["",3311],["ship",275],["submarine",18],["aircraft",16],["plane",10],["boat",3],["schooner",2],["car",2],["sailboat",2],["steamer",1],["airplane",1],["freightcar",1],["train",1],["paddle steamer",1],["vehicle",1],["motorbike",1],["helicopter",1],["Steam hoist",1],["tractor",1],["Airplane",1]]},"kind":"categorical","n":354770,"n_null":351117,"n_unique":23,"null_rate":0.9897031879809454,"stats":{"cardinality":23,"entropy":0.576412765750529,"entropy_ratio":0.12742453211649218,"top_rate":0.9063783191897071,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"13 singleton categories"},{"code":"null_rate","level":"warn","message":"99.0% null"},{"code":"imbalance","level":"warn","message":"top value is 99.4% of rows"}],"column":"cargo","extras":{"singletons":13,"top_values":[["",3632],["human",4],["timber",2],["coal",2],["fertilizer",1],["ore pellets",1],["Fischkutter 
(Stahl)",1],["seafood",1],["fish",1],["passengers",1],["mexican army supposed drugs, but the crew and cargo was not found",1],["iron ore",1],["pulp",1],["18 mines, 6 torpedos",1],["sugar",1],["containers;vehicles",1],["container;oil",1]]},"kind":"categorical","n":354770,"n_null":351117,"n_unique":17,"null_rate":0.9897031879809454,"stats":{"cardinality":17,"entropy":0.07301985554225272,"entropy_ratio":0.017864347243806682,"top_rate":0.9942513003011224,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"99.8% null"}],"column":"peak_brightness_altitude_km","extras":{"singletons":111,"top_values":[["37.0",35],["31.5",15],["33.3",15],["38.0",11],["29.6",11],["35.2",11],["40.7",11],["32.0",10],["26.0",10],["32.4",9],["42.0",8],["26.5",8],["33.0",8],["25.0",7],["50.0",7],["36.0",7],["35.0",6],["39.0",6],["28.7",6],["37",6]]},"kind":"categorical","n":354770,"n_null":354193,"n_unique":224,"null_rate":0.9983735941595964,"stats":{"cardinality":224,"entropy":7.187137873819712,"entropy_ratio":0.9205599009613827,"top_rate":0.060658578856152515,"top_value":"37.0"}},{"alerts":[{"code":"null_rate","level":"warn","message":"99.9% null"}],"column":"velocity_km_s","extras":{"singletons":65,"top_values":[["13.6",6],["15.2",6],["16.9",6],["17.8",5],["20.1",5],["17.4",5],["13.1",5],["16.2",5],["19.8",5],["16.5",5],["15.9",5],["14.1",5],["18.1",5],["14.9",5],["12.9",5],["12.2",5],["19.6",4],["17.0",4],["14.4",4],["18.3",4]]},"kind":"categorical","n":354770,"n_null":354421,"n_unique":158,"null_rate":0.999016264058404,"stats":{"cardinality":158,"entropy":7.052191926122492,"entropy_ratio":0.9655536179508943,"top_rate":0.017191977077363897,"top_value":"13.6"}},{"alerts":[{"code":"long_tail","level":"info","message":"361 singleton categories"},{"code":"null_rate","level":"warn","message":"99.8% 
null"}],"column":"energy_joules","extras":{"singletons":361,"top_values":[["2.1",15],["2.0",13],["3.2",13],["3.0",10],["2.8",8],["2.3",8],["3.5",8],["2.7",8],["2.2",8],["4.1",8],["3.3",7],["2.5",7],["4.0",6],["2.9",6],["3.1",6],["5.8",6],["10.4",6],["11.8",6],["3.6",5],["4.4",5]]},"kind":"categorical","n":354770,"n_null":353907,"n_unique":518,"null_rate":0.9975674380584604,"stats":{"cardinality":518,"entropy":8.634265674041822,"entropy_ratio":0.9575744984877702,"top_rate":0.01738122827346466,"top_value":"2.1"}},{"alerts":[{"code":"null_rate","level":"warn","message":"95.8% null"}],"column":"event_type","extras":{"singletons":4,"top_values":[["Tornado",6334],["Flash Flood",2358],["Thunderstorm Wind",2257],["Flood",1777],["Hail",1246],["Lightning",574],["Heavy Rain",99],["Marine Strong Wind",43],["Debris Flow",43],["Marine Thunderstorm Wind",25],["Marine High Wind",5],["Dust Devil",3],["Waterspout",2],["Tropical Storm",1],["High Wind",1],["Heat",1],["Marine Lightning",1]]},"kind":"categorical","n":354770,"n_null":340000,"n_unique":17,"null_rate":0.9583673929588183,"stats":{"cardinality":17,"entropy":2.336076472984396,"entropy_ratio":0.5715223755452659,"top_rate":0.4288422477995938,"top_value":"Tornado"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"allcaps","level":"info","message":"87.2% rows are all-caps"},{"code":"null_rate","level":"warn","message":"95.8% null"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"93.1% duplicate 
strings"}],"column":"damage_property","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[368,0,0,0,0,264,0,0,0,0,1252,0,0,0,0,1172,0,0,0,0,3414,0,0,0,0,6075,0,0,0,0,1450,0,0,0,0,514,0,0,0,261],"edges":[0.0,0.2,0.4,0.6000000000000001,0.8,1.0,1.2000000000000002,1.4000000000000001,1.6,1.8,2.0,2.2,2.4000000000000004,2.6,2.8000000000000003,3.0,3.2,3.4000000000000004,3.6,3.8000000000000003,4.0,4.2,4.4,4.6000000000000005,4.800000000000001,5.0,5.2,5.4,5.6000000000000005,5.800000000000001,6.0,6.2,6.4,6.6000000000000005,6.800000000000001,7.0,7.2,7.4,7.6000000000000005,7.800000000000001,8.0]},"near_unique":false,"sample":["250K","40.00M","3.00M","20.00K","3.17M","15.00M","1.00M","0.00K","0.00K","25K","3.00M","10.00M","1M","25K",".15M","2.5M","2.5M","5.40M","0.00K","1.5M","2.7M","2.5M","2.5M","2.5M","1.50M","986.00K","2.50M","0","2.5M","","5.00M","161.10M","3.00M","150K","3.5M","13M","8.00M","6.50M","0.00K","5.60M","9.20M","0.00K","15M","3.10M","","3.50M","5K","1M","2.5M","15.00K"],"top_values":[["2.5M",2278],["1.00M",1306],["0.00K",1229],["2.00M",553],["25M",530],["250K",471],["1M",457],["",368],["1.50M",334],["5.00M",325],["3.00M",297],["0",264],["2M",231],["10.00M",212],["5M",182],["25K",178],["4.00M",155],["2.50M",136],["1.5M",123],["10.00K",113]],"top_words":[["2.5m",2278],["1.00m",1306],["0.00k",1229],["2.00m",553],["25m",530],["250k",471],["1m",457],["1.50m",334],["5.00m",325],["3.00m",297],["0",264],["2m",231],["10.00m",212],["5m",182],["25k",178],["4.00m",155],["2.50m",136],["1.5m",123],["10.00k",113],["0k",111],["3m",109],["1.20m",109],["1000.00k",102],["10m",92],["50.00m",78]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,14770,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0
666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":354770,"n_null":340000,"n_unique":1014,"null_rate":0.9583673929588183,"stats":{"allcaps_rate":0.872444143534191,"boilerplate_rate":0.0,"duplicate_rate":0.9313473256601219,"emoji_rate":0.0,"len_max":8,"len_mean":4.380568720379147,"len_median":5.0,"len_min":0,"len_p95":7.0,"n_duplicates":13756,"n_empty":368,"one_word_rate":1.0,"readability_flesch_mean":116.97730000000003,"url_rate":0.0,"vocab_size":1013,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"100.0% null"}],"column":"cave_type","extras":{"singletons":3,"top_values":[["pit",36],["ponor",2],["showcave",1],["sinkhole",1],["overhang",1]]},"kind":"categorical","n":354770,"n_null":354729,"n_unique":5,"null_rate":0.9998844321673197,"stats":{"cardinality":5,"entropy":0.7693251740833704,"entropy_ratio":0.33133031801343993,"top_rate":0.8780487804878049,"top_value":"pit"}},{"alerts":[{"code":"long_tail","level":"info","message":"158 singleton categories"},{"code":"null_rate","level":"warn","message":"99.8% null"}],"column":"cave_length_m","extras":{"singletons":158,"top_values":[["5",32],["6",26],["10",25],["3",23],["4",23],["7",20],["8",19],["15",16],["20",14],["12",13],["30",13],["2",11],["11",9],["60",8],["4.5",8],["13",8],["16",8],["17",8],["25",8],["9",7]]},"kind":"categorical","n":354770,"n_null":354128,"n_unique":237,"null_rate":0.9981903768638837,"stats":{"cardinality":237,"entropy":6.91866052861727,"entropy_ratio":0.8770294976431803,"top_rate":0.04984423676012461,"top_value":"5"}},{"alerts":[{"code":"long_tail","level":"info","message":"88 singleton categories"},{"code":"null_rate","level":"warn","message":"99.9% 
null"}],"column":"cave_depth_m","extras":{"singletons":88,"top_values":[["0",63],["10",13],["3",11],["1",9],["5",9],["4",8],["25",7],["30",6],["6",6],["2",6],["11",5],["35",5],["28",4],["14",4],["40",4],["70",4],["12",3],["8",3],["15",3],["23",3]]},"kind":"categorical","n":354770,"n_null":354472,"n_unique":124,"null_rate":0.9991600191673479,"stats":{"cardinality":124,"entropy":5.797302195708671,"entropy_ratio":0.8336408604182984,"top_rate":0.21140939597315436,"top_value":"0"}},{"alerts":[{"code":"null_rate","level":"warn","message":"98.0% null"}],"column":"access","extras":{"singletons":7,"top_values":[["yes",2753],["no",2279],["private",830],["permit",586],["permissive",448],["customers",273],["unknown",51],["destination",11],["restricted",9],["tidal",2],["request",2],["key",2],["discouraged",2],["designated",1],["official",1],["forestry",1],["agricultural",1],["guided",1],["university",1],["cancello_all'ingresso",1]]},"kind":"categorical","n":354770,"n_null":347515,"n_unique":20,"null_rate":0.9795501310708347,"stats":{"cardinality":20,"entropy":2.2342922281044104,"entropy_ratio":0.5169665434155355,"top_rate":0.37946243969676086,"top_value":"yes"}},{"alerts":[{"code":"one_word","level":"warn","message":"93.6% rows are a single word"},{"code":"allcaps","level":"info","message":"85.6% rows are all-caps"},{"code":"null_rate","level":"warn","message":"97.9% null"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 
chars"}],"column":"cave_ref","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[36,210,356,954,412,1123,2763,1372,232,29,44,28,11,0,2,2,3,3,1,1,1,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.925,2.85,3.7750000000000004,4.7,5.625,6.550000000000001,7.4750000000000005,8.4,9.325000000000001,10.25,11.175,12.100000000000001,13.025,13.950000000000001,14.875,15.8,16.725,17.650000000000002,18.575,19.5,20.425,21.35,22.275000000000002,23.200000000000003,24.125,25.05,25.975,26.900000000000002,27.825000000000003,28.75,29.675,30.6,31.525000000000002,32.45,33.375,34.300000000000004,35.225,36.15,37.075,38.0]},"near_unique":false,"sample":["C 23","3125","JP-88","12","5381-116","5372-60","1862/15a","102","1008","1868/28","4732-10","4423-74","1873/22b","1547/9","3092","1861/21b","1915/43","218","4430-3","3163","2782/27","1866/51","1866/104","6847/10","2445","3128","1853/138","1863/39","1913/7","5341-64","477-031z","2911/29b","1313","1867/64b","288LO","5372-8","4423-64","1863/146","2726/1","388LO","1167","4120-129","7623/3","4120-149","4630-25","BL 206/003","6845/69a","D 
121","1911/96","4450-24"],"top_values":[["6847/K1",26],["1852/18b",9],["4",8],["20",6],["3",5],["5",5],["4762-2",5],["41",5],["6",5],["10",5],["24",5],["21",5],["23",5],["no",4],["A161",4],["15",4],["8",4],["89",4],["5430-1",4],["4840-1",4]],"top_words":[["ra",143],["d",88],["c",72],["pu",35],["6847/k1",26],["f",22],["b",20],["la",12],["4",11],["v",9],["1852/18b",9],["44",8],["5",8],["33",8],["h",8],["17",8],["42",8],["a",8],["20",8],["6",7],["21",7],["|",7],["na",7],["23",6],["14",6]],"vocab_skipped":null,"word_histogram":{"counts":[7100,0,0,0,0,0,0,462,0,0,0,0,0,0,0,20,0,0,0,0,0,0,3,0,0,0,0,0,0,1],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":354770,"n_null":347184,"n_unique":7162,"null_rate":0.9786171322265129,"stats":{"allcaps_rate":0.8559187977853941,"boilerplate_rate":0.0,"duplicate_rate":0.055892433430002636,"emoji_rate":0.0,"len_max":38,"len_mean":6.340891115212233,"len_median":7.0,"len_min":1,"len_p95":8.0,"n_duplicates":424,"n_empty":0,"one_word_rate":0.9359346163986291,"readability_flesch_mean":117.76495000000003,"url_rate":0.0,"vocab_size":7005,"word_mean":1.06788821513314,"word_median":1.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"75.1% 
null"}],"column":"osm_id","extras":{"histogram":{"counts":[3968,2767,3230,3501,3041,2397,1663,1794,2343,2457,2751,2046,1826,2556,2957,2055,1481,1420,2234,1597,2035,2535,2516,1909,2018,1425,2194,1852,3471,2391,1034,1192,1627,3575,1447,1836,1355,2246,1582,2072],"edges":[1334095.0,338043085.15,674752075.3,1011461065.4499999,1348170055.6,1684879045.75,2021588035.8999999,2358297026.0499997,2695006016.2,3031715006.35,3368423996.5,3705132986.6499996,4041841976.7999997,4378550966.95,4715259957.099999,5051968947.25,5388677937.4,5725386927.549999,6062095917.7,6398804907.849999,6735513898.0,7072222888.15,7408931878.299999,7745640868.45,8082349858.599999,8419058848.749999,8755767838.9,9092476829.05,9429185819.199999,9765894809.349998,10102603799.5,10439312789.65,10776021779.8,11112730769.949999,11449439760.099998,11786148750.25,12122857740.4,12459566730.55,12796275720.699999,13132984710.849998,13469693701.0]},"sample":[335634789.0,344524946.0,367532102.0,427075475.0,540167863.0,655156576.0,658939634.0,690978041.0,745732078.0,766770797.0,778197264.0,779080713.0,823751254.0,828668617.0,861256358.0,861256643.0,861257567.0,861258141.0,861258184.0,918735580.0,958274573.0,981449084.0,986022029.0,1255446579.0,1329693440.0,1347268846.0,1372949297.0,1373516268.0,1550070909.0,1612934350.0,1616608609.0,1663133732.0,1696510777.0,1706213701.0,1706213908.0,1711142491.0,1724243187.0,1737271853.0,1746677987.0,1750764037.0,1760101550.0,1769673853.0,1792277533.0,1806623449.0,1807673949.0,1836483302.0,1844348279.0,1976969322.0,2059751748.0,2065762176.0,2104789608.0,2134166402.0,2169637852.0,2279794401.0,2302621684.0,2326381777.0,2351101940.0,2358240817.0,2397795680.0,2415394133.0,2428129418.0,2470473465.0,2501127235.0,2507209570.0,2525613333.0,2596028129.0,2612085143.0,2618905537.0,2778226613.0,2778226629.0,2789327169.0,2795822089.0,2801480885.0,2813830231.0,2855268975.0,2866848488.0,2921803875.0,2971205537.0,2973065043.0,2981984954.0,3003081756.0,3008237210.0,3137844507.0,3142730034.0,3142733138
.0,3160082113.0,3160885959.0,3184309782.0,3184327585.0,3187057566.0,3220022176.0,3277377579.0,3287419748.0,3323401916.0,3387910610.0,3389064371.0,3424972272.0,3437149580.0,3437150019.0,3494812595.0,3507254424.0,3583975602.0,3600450498.0,3640400865.0,3649612504.0,3659213476.0,3679582663.0,3686881861.0,3855447437.0,4026442065.0,4081963316.0,4086768866.0,4172814661.0,4185669267.0,4244921112.0,4261545880.0,4314207082.0,4337913245.0,4340295164.0,4362391968.0,4393974273.0,4411116124.0,4530498298.0,4563506777.0,4573189069.0,4621854035.0,4626807321.0,4681548143.0,4687225474.0,4790142221.0,4801817756.0,4801817770.0,4801817781.0,4804177218.0,4855786079.0,4868792914.0,4869910574.0,4877463119.0,4894898934.0,4915326021.0,4922948459.0,4933645339.0,4935713613.0,4935721263.0,4947181615.0,4983869273.0,5018305083.0,5037906007.0,5052320563.0,5081582522.0,5092429989.0,5115776588.0,5136212840.0,5188408735.0,5228590662.0,5240732250.0,5246328959.0,5246329193.0,5262208401.0,5300966072.0,5310934627.0,5325808066.0,5412323757.0,5414229298.0,5415322506.0,5526891603.0,5618381424.0,5627645999.0,5673531526.0,5725217600.0,5760073565.0,5779163795.0,5842410362.0,5929011322.0,6027045395.0,6027225654.0,6174547732.0,6329709187.0,6348112101.0,6352770863.0,6357009346.0,6357009363.0,6357010117.0,6368677036.0,6368677049.0,6372990943.0,6442333995.0,6476931738.0,6597642956.0,6604435070.0,6771083296.0,7029343770.0,7061963418.0,7073923111.0,7076551885.0,7078381159.0,7078702213.0,7078773529.0,7117833447.0,7172725330.0,7211572890.0,7223331150.0,7241185682.0,7276457460.0,7381491220.0,7412169726.0,7415025331.0,7425776959.0,7433019274.0,7438981763.0,7439530475.0,7444525663.0,7454029194.0,7464656965.0,7465075702.0,7486257776.0,7499495242.0,7501577421.0,7538965058.0,7554248793.0,7606516637.0,7622959163.0,7631850085.0,7636235818.0,7636242726.0,7636242729.0,7636242740.0,7728125373.0,7761577775.0,7783475082.0,7809288904.0,7816026392.0,7824056298.0,7841016246.0,7862277380.0,7881862384.0,7900649572.0,7921262795.0,79218134
25.0,7938822989.0,7945899363.0,7952118818.0,8016871016.0,8041591953.0,8165446480.0,8238347288.0,8296594453.0,8322200858.0,8361419727.0,8389114917.0,8403415003.0,8410667979.0,8442364495.0,8446541545.0,8511580748.0,8538601863.0,8541936176.0,8557649817.0,8570784581.0,8630622137.0,8636538236.0,8680701538.0,8740002292.0,8807314840.0,8863438057.0,8949755465.0,8983503677.0,8997115617.0,9032945381.0,9167068117.0,9186535921.0,9329415869.0,9341903343.0,9363490711.0,9383216862.0,9383908382.0,9403207943.0,9406241669.0,9476413690.0,9483688129.0,9500071382.0,9502190903.0,9502482344.0,9505123128.0,9505124951.0,9510599421.0,9521479292.0,9521847809.0,9523029932.0,9530393338.0,9533534659.0,9557467045.0,9598466790.0,9705481672.0,9730236131.0,9748255342.0,9784475309.0,9846819199.0,9904934225.0,10000390210.0,10022306675.0,10064553869.0,10088777557.0,10135958813.0,10160035916.0,10178878213.0,10300219203.0,10568258786.0,10695491615.0,10791146615.0,10815331044.0,10817147496.0,10844547886.0,10858060391.0,10926171694.0,10948644988.0,10948644989.0,10951875936.0,10958628240.0,11080021936.0,11227969602.0,11276729859.0,11286854949.0,11307577517.0,11307577597.0,11307577657.0,11307577817.0,11307577887.0,11307577938.0,11307577953.0,11307578013.0,11307578124.0,11307578251.0,11307578368.0,11307578488.0,11307578800.0,11307578945.0,11307579339.0,11330210241.0,11362578887.0,11409739091.0,11420065534.0,11464749578.0,11510596489.0,11764097966.0,11769763067.0,11774120968.0,11780229616.0,11844568090.0,11846479958.0,11865825041.0,11891062746.0,11892231634.0,12122852037.0,12141774084.0,12141951678.0,12148729455.0,12201420011.0,12253282166.0,12262792421.0,12273175098.0,12330592668.0,12388658490.0,12467359196.0,12525922221.0,12574227883.0,12595897467.0,12653311997.0,12661254608.0,12681096307.0,12695940277.0,12748832413.0,12750001830.0,12759976686.0,12762880018.0,12823702628.0,12844260009.0,12874758958.0,12883314477.0,12889306208.0,12912163901.0,13022991191.0,13027927900.0,13067897927.0,13076113602.0,13088193007
.0,13119465689.0,13136939207.0,13146846617.0,13169305134.0,13254057218.0,13272756495.0,13276235717.0,13285952972.0,13289548969.0,13289892839.0,13352723711.0,13353832440.0,13363416740.0,13398465440.0,13421970477.0,13423481435.0,13452521449.0,1033828041.0,1082074464.0,1115503456.0,1258280518.0,242987968.0,243023265.0,243023523.0,243030678.0,243032194.0,243038122.0,243039318.0,243041145.0,243045100.0,337658653.0,337659749.0,534097295.0,600917219.0,619200004.0,746698949.0,767046451.0,804939508.0,818903928.0,824769005.0,888411499.0,1106253733.0,1165104003.0,1235708725.0,1293173675.0,1319064736.0,1332098700.0,1362383001.0,1376298942.0,1382226209.0,1422711436.0,1424940580.0,1718134355.0,2033296100.0,2517671681.0,3050757794.0,3160605535.0,3425029176.0,3450362791.0,3483825595.0,3492711936.0,3690011446.0,3812851555.0,3813603161.0,4108941846.0,4458127688.0,4641738641.0,5048878295.0,5265979990.0,6405891054.0,6405891068.0,6700404554.0,7096935279.0,7239074224.0,7391204075.0,7617677520.0,7643982543.0,7648522413.0,8412483892.0,8479637345.0,8522672254.0,8747450022.0,8771756653.0,8870084647.0,8871922569.0,8893129084.0,9758802216.0,9828435312.0,9835169900.0,10570013142.0,10807313458.0,10946928419.0,11367854035.0,11570654525.0,11882402467.0,12096601734.0,12796251256.0,12847448323.0,12861129142.0,13416168376.0,13420945154.0,13423761459.0,13447729872.0,94226641.0,105200825.0,355765226.0,740134775.0,932874964.0,1113701948.0,1238115288.0,1429969767.0,7659788.0,7660357.0,7663210.0]},"kind":"numeric","n":354770,"n_null":266374,"n_unique":88395,"null_rate":0.7508357527412126,"stats":{"iqr":6902713242.5,"kurtosis":-1.2284091976144316,"max":13469693701.0,"mean":6182550152.988608,"median":6047018322.5,"min":1334095.0,"n_outliers":0,"outlier_rate":0.0,"q1":2627612475.25,"q3":9530325717.75,"skew":0.13212538540986568,"std":3992760870.7543554,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"75.1% null"},{"code":"imbalance","level":"warn","message":"top value is 96.4% of 
rows"}],"column":"osm_type","extras":{"singletons":0,"top_values":[["node",85204],["way",2560],["relation",632]]},"kind":"categorical","n":354770,"n_null":266374,"n_unique":3,"null_rate":0.7508357527412126,"stats":{"cardinality":3,"entropy":0.250087766358402,"entropy_ratio":0.15778781279974283,"top_rate":0.9638897687678175,"top_value":"node"}},{"alerts":[{"code":"long_tail","level":"info","message":"31 singleton categories"},{"code":"null_rate","level":"warn","message":"94.9% null"}],"column":"place_type","extras":{"singletons":31,"top_values":[["hamlet",12086],["isolated_dwelling",2977],["village",2388],["locality",251],["yes",131],["farm",122],["neighbourhood",73],["town",38],["suburb",23],["quarter",7],["square",7],["island",4],["local",4],["allotments",4],["house",3],["city",3],["islet",2],["county",1],["bus_station",1],["hamtel",1]]},"kind":"categorical","n":354770,"n_null":336616,"n_unique":48,"null_rate":0.9488288186712518,"stats":{"cardinality":48,"entropy":1.4980368242580269,"entropy_ratio":0.2682268366286423,"top_rate":0.6657485953508868,"top_value":"hamlet"}},{"alerts":[{"code":"long_tail","level":"info","message":"97 singleton categories"},{"code":"null_rate","level":"warn","message":"99.7% null"}],"column":"abandoned_year","extras":{"singletons":97,"top_values":[["yes",534],["village",433],["2022",20],["1986",11],["hamlet",9],["1978",6],["1974",6],["1987",5],["2023",4],["1950",4],["1985",4],["1983",3],["~1500",3],["2013-12-02",3],["isolated_dwelling",3],["2022-12-26",3],["1946",3],["1938",3],["1955",3],["1962",3]]},"kind":"categorical","n":354770,"n_null":353545,"n_unique":147,"null_rate":0.9965470586577219,"stats":{"cardinality":147,"entropy":2.9386137647250816,"entropy_ratio":0.40815937503498584,"top_rate":0.4359183673469388,"top_value":"yes"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"abandoned_reason","extras":{},"kind":"unknown","n":354770,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"99.3% null"}],"column":"former_population","extras":{"singletons":30,"top_values":[["0",1251],["2010",574],["2024",244],["2010-10-14",81],["2008",69],["2021-08-31",53],["1999",37],["2009",12],["1",11],["2021",11],["2021-09-01",10],["2021-10-01",10],["1989",9],["2018-01-01",9],["2005",8],["2016",7],["10",7],["3",6],["2001",6],["2",6]]},"kind":"categorical","n":354770,"n_null":352243,"n_unique":75,"null_rate":0.9928770752882149,"stats":{"cardinality":75,"entropy":2.604815213728114,"entropy_ratio":0.4181876762126051,"top_rate":0.4950534230312624,"top_value":"0"}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"100.0% null"}],"column":"heritage","extras":{"singletons":5,"top_values":[["2",2],["8",1],["yes",1],["4",1],["district",1],["3",1]]},"kind":"categorical","n":354770,"n_null":354763,"n_unique":6,"null_rate":0.9999802689066155,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"2"}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["category.top_values","category.null_rate","duration_seconds.stats","depth_km.stats","shape.null_rate","damage_property.null_rate","source.top_values","fatalities.top_values","event_type.top_values"],"featured_charts":[{"caption":"Shows how records are split across the 14 source datasets \u2014 tornadoes, caves, and UFO sightings each dominate, but all 14 categories are present.","column":"category","kind":"bar"},{"caption":"For UFO sighting rows, 'light' is by far the most reported shape, followed by triangle and circle \u2014 look for the long tail of rarer forms.","column":"shape","kind":"bar"},{"caption":"Among storm-event rows, tornadoes 
vastly outnumber flash floods and thunderstorm winds, revealing a strong imbalance in weather event coverage.","column":"event_type","kind":"bar"},{"caption":"Extreme right-skew with a median of 180 seconds but a max of 66 million seconds \u2014 look for the spike near zero and the extreme outliers.","column":"duration_seconds","kind":"histogram"},{"caption":"L6 and H5 ordinary chondrites dominate meteorite finds, with a long tail of rarer classes worth noting for completeness of the record.","column":"meteorite_class","kind":"bar"}],"model":"anthropic:default","narrative":"This is a 354,770-row mashup of 14 heterogeneous 'strange places' datasets \u2014 spanning tornadoes, UFO sightings, cave entrances, meteorites, ghost towns, earthquakes, shipwrecks, and more \u2014 unified under a single 'category' column. The most important thing to examine first is the category distribution, which reveals that no single source dominates but tornadoes (~71K), caves (~70K), and UFO sightings (~61K) each make up roughly 17\u201320% of records. A second key signal is the pervasive sparsity: most domain-specific columns (depth_km, duration_seconds, shape, damage_property) carry null rates of 80\u201399%, meaning each column is only meaningful for the subset of rows belonging to its originating dataset. 
UFO sighting durations show extreme right-skew (median 180 s, max 66 million s) and earthquake depths are similarly skewed, both worth closer inspection within their respective subsets.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["top_values","null_rate","duplicate_rate","n_duplicates","n_empty","n_unique","allcaps_rate","len_median","len_p95"],"model":"anthropic:default","narrative":"This column contains ISO-format date strings (YYYY-MM-DD), stored as text rather than a proper date type, representing what appear to be annual publication or release dates \u2014 all top values fall on January 1st of a given year, suggesting date precision is year-level only. Two major data quality issues stand out: a 41.88% null rate (including 17,854 empty strings) and an 88.6% duplicate rate across 354,770 rows with only 23,500 unique values. The 'allcaps' alert is a false positive from the Saturn parser \u2014 ISO date strings trigger it due to lack of lowercase letters.","role":"timestamp","scope":"column","target":"date","treatment":"Cast to date type, impute or flag the 41.88% nulls, and consider extracting year as an integer feature given all values are Jan-1 anchored."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","duplicate_rate","n_unique","top_values","len_mean","len_max","one_word_rate","allcaps_rate","n"],"model":"anthropic:default","narrative":"This column stores numeric distance measurements (miles) encoded as text strings \u2014 all values are single tokens like '0.1', '0.5', '1.0' with a mean character length of 3.69 and a max of 8. Two signals demand attention: the null rate is extremely high at 79.76%, meaning roughly four in five rows carry no value, and the duplicate rate among non-null values is 94.72%, reflecting a coarse, rounded measurement scale (only 3,795 unique values across 354,770 rows). 
The top value '0.1' alone appears 15,456 times, suggesting heavy concentration at short distances.","role":"feature","scope":"column","target":"length_miles","treatment":"Cast to float, investigate and handle the 79.76% nulls (impute or flag), then use directly or log-transform given likely right skew."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","duplicate_rate","n_unique","top_values","top_words","one_word_rate","vocab_size"],"model":"anthropic:default","narrative":"This column contains US city names, confirmed by top values (Seattle, Phoenix, Las Vegas, Portland, Los Angeles) and top words ('beach', 'san', 'lake', 'springs'). The most striking issue is the 82.91% null rate \u2014 only roughly 1 in 6 rows has a city value at all, making this field sparsely populated. Despite that sparsity, the duplicate rate among non-null values is 84.91%, indicating that populated rows cluster around a relatively small set of repeated cities (9,149 unique values from 4,862 vocab tokens). The word 'city' appearing 531 times in top_words most likely reflects legitimate place names that contain the word, such as 'Kansas City' or 'Oklahoma City', rather than data quality noise.","role":"feature","scope":"column","target":"city","treatment":"Impute or flag nulls (82.91% missing) before use; consider grouping rare cities or encoding as region/state for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","skew","kurtosis","median","mean","max","n_outliers","outlier_rate","min","q1","q3"],"model":"anthropic:default","narrative":"This column records event or session durations in seconds, with values ranging from 0.01 s to 66,276,000 s (~767 days). The most striking issue is that 82.91% of rows are null, meaning duration is only captured for roughly 1-in-6 records. 
Among non-null values the distribution is catastrophically right-skewed (skew = 135.86, kurtosis = 19,379.84): the median is just 180 s while the mean inflates to 5,410 s, and 7,753 rows (12.79% of non-null) are flagged as outliers\u2014the maximum of 66,276,000 s is almost certainly erroneous or represents a sentinel/unclosed-session value.","role":"feature","scope":"column","target":"duration_seconds","treatment":"Investigate and cap or remove extreme outliers (especially values near 66276000.0), impute or flag nulls explicitly, then log-transform before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","n_unique","entropy_ratio","top_values"],"model":"anthropic:default","narrative":"This column stores OpenStreetMap geometry type classifications, taking only three possible values: 'node', 'way', and 'relation'. Two signals demand attention: 75.08% of the 354,770 rows are null, meaning OSM type is only recorded for roughly a quarter of records, and among the non-null values the distribution is severely imbalanced \u2014 'node' accounts for 96.39% of non-null entries (85,204 occurrences) versus 2,560 'way' and just 632 'relation'. The near-zero entropy ratio (0.158) confirms this column carries very little discriminative information as-is.","role":"feature","scope":"column","target":"osm_type","treatment":"Impute nulls as a distinct 'unknown' category, then one-hot encode; consider whether the 'way'/'relation' minority classes carry signal worth preserving or should be collapsed."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","cardinality","n_unique","top_values"],"model":"anthropic:default","narrative":"This column classifies meteorite recovery type, distinguishing between specimens that were 'Found' (discovered without an observed fall) versus 'Fell' (witnessed falling). Striking is the 90.93% null rate, meaning only ~32,186 of 354,770 records have a value at all. 
Among those with values, the distribution is heavily skewed: 'Found' accounts for 96.6% (31,090) versus 'Fell' at just 3.4% (1,096), which aligns with real-world meteorite data but constitutes a severe class imbalance alert.","role":"label","scope":"column","target":"fall_type","treatment":"Impute nulls as a third category ('Unknown') or exclude from classification tasks; apply class-weighting or oversampling to address the 97:3 Found-to-Fell imbalance before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["duplicate_rate","n_duplicates","top_values","language_counts","len_median","len_mean","len_p95","alerts","n"],"model":"anthropic:default","narrative":"This column contains free-text descriptions of geographic or physical features \u2014 cave entrances, former hamlets, hot springs, shipwrecks, and tornado tracks (e.g. 'F0, 0.1mi long, 10yd wide') dominate the top values, suggesting a points-of-interest or geographic gazetteer dataset. The duplicate rate is strikingly high at 38.3%, driven by 136,053 repeated values out of 354,770 rows, largely from templated entries like 'Cave entrance' (52,067 occurrences) and storm-track boilerplate. Text is overwhelmingly English (4,893 sampled as English) but 21 languages are detected including German (28), Bashkir (13), Russian (9), and Belarusian (9), flagging a multilingual minority that may require separate handling. 
The wide spread between median length (40 chars) and mean (114 chars) with a p95 of 491 indicates a heavily right-skewed length distribution.","role":"free_text","scope":"column","target":"description","treatment":"Deduplicate or group templated entries before NLP; apply language detection and route non-English rows to language-specific pipelines; tokenize and embed for semantic modelling."},{"confidence":"high","critiques":[],"evidence_keys":["top_values","top_words","stats.duplicate_rate","stats.n_duplicates","n_unique","n","language_counts","alerts"],"model":"anthropic:default","narrative":"This column contains the name or title of individual records in what appears to be a multi-domain dataset covering natural features (caves), weather events (tornadoes by US state), and UFO sightings. The duplicate rate is strikingly high at 46.5%, driven largely by templated strings like 'Unnamed Cave' (19,962 occurrences) and repeated tornado/state/count patterns. Despite the predominantly English content (3,363 language-detected values skewing English), the multilingual alert flags 30 detected languages including German (230), French (279), Italian (236), Russian (102), and Spanish (156), suggesting internationally-sourced named entities mixed into the dataset. Analysts should note that near-half of values are non-unique, so this column cannot serve as a reliable identifier.","role":"label","scope":"column","target":"name","treatment":"Deduplicate or group by name pattern before use; consider splitting templated names (e.g. 'Tornado in TX, 48') into structured fields; embed free-form names if semantic similarity is needed."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","kurtosis","outlier_rate","n_outliers","zero_rate","null_rate"],"model":"anthropic:default","narrative":"This column contains geographic latitude values, ranging from -87.37\u00b0 to 88.5\u00b0, consistent with global coordinates. 
The distribution is surprisingly left-skewed (skew = -2.84) with high kurtosis (7.30), meaning there is a heavy tail toward negative (southern hemisphere) latitudes despite the median sitting at ~40.6\u00b0N \u2014 suggesting the bulk of records are mid-latitude northern hemisphere but a notable minority of extreme southern values pull the mean down. About 9.4% of rows (33,355) are flagged as outliers, likely driven by records near the poles or far southern hemisphere; the near-zero zero_rate (0.06%) is negligible but worth checking for sentinel nulls encoded as 0.","role":"feature","scope":"column","target":"latitude","treatment":"Retain as-is for geospatial modelling; investigate ~0.06% zero-value rows as possible null sentinels, and review 33,355 outlier records for data quality before clustering or distance-based methods."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","n","n_unique","top_values","alerts"],"model":"anthropic:default","narrative":"This column captures the settlement/place classification type, likely from an OpenStreetMap-style geographic dataset, with values such as 'hamlet', 'isolated_dwelling', 'village', and 'town'. The most striking signal is the extreme null rate of 94.88%, meaning only 18,154 of 354,770 rows carry a value \u2014 the column is essentially sparse. 
Among populated rows, 'hamlet' dominates at 66.57% of non-null values, and the presence of a raw 'yes' tag (131 occurrences) indicates dirty or uncleaned OSM data that needs remediation.","role":"label","scope":"column","target":"place_type","treatment":"Filter or impute nulls before use; remap 'yes' and other dirty values; treat as low-cardinality categorical with one-hot or ordinal encoding reflecting settlement hierarchy."},{"confidence":"high","critiques":[],"evidence_keys":["column","null_rate","n","n_unique","stats.min","stats.max","stats.kurtosis","stats.n_outliers"],"model":"anthropic:default","narrative":"This column contains OpenStreetMap (OSM) numeric identifiers, likely referencing geographic features such as ways, relations, or nodes in the OSM database. The most striking issue is a 75.08% null rate across 354,770 rows, meaning only about one quarter of records carry an OSM linkage. With 88,395 unique values against 88,396 non-null rows, the near-unique cardinality and platykurtic distribution (kurtosis \u2248 -1.23) are consistent with IDs drawn broadly across OSM's ID space (min ~1.3M, max ~13.5B), with no outliers detected.","role":"foreign_key","scope":"column","target":"osm_id","treatment":"Left-join on this id to OSM data after filtering or imputing the 75.08% nulls; investigate whether missingness is systematic before joining."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_rate","top_values","n"],"model":"anthropic:default","narrative":"This column records the data provider or attribution source for each row, with only 4 distinct values drawn from named external datasets (OpenStreetMap contributors, The Megalithic Portal, NOAA Storm Events Database, OpenStreetMap). The most striking signal is a 51.56% null rate \u2014 meaning over half of all 354,770 rows carry no source attribution, which is a data quality concern for provenance tracking. 
The top value 'OpenStreetMap contributors' accounts for 51.44% of non-null rows (88,396 records), while the closely related 'OpenStreetMap' (8,656 records) suggests inconsistent attribution for the same upstream source.","role":"metadata","scope":"column","target":"source","treatment":"Consolidate 'OpenStreetMap contributors' and 'OpenStreetMap' into a single category, investigate and impute or flag the 51.56% nulls before using as a stratification or filter variable."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","n_unique","entropy","top_values","n"],"model":"anthropic:default","narrative":"This column captures country of origin or residence, using a mix of ISO 2-letter codes and full-name variants. The most alarming issue is a 55.29% null rate, meaning over half of 354,770 rows carry no country value. Compounding this, 'USA' and 'US' are effectively the same country but stored as two distinct values (86,583 and 60,634 respectively), together accounting for ~92.8% of non-null records ('USA' alone is ~54.6%) \u2014 indicating inconsistent data entry that inflates apparent cardinality. There are also 9,497 empty-string records that escaped null detection, and the distribution is heavily US-dominated with 28 unique values at low entropy (1.34).","role":"feature","scope":"column","target":"country","treatment":"Unify 'USA'/'US' and other aliases into ISO-3166 codes, convert empty strings to null, then impute or flag remaining nulls before using as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_rate","cardinality","top_values","n"],"model":"anthropic:default","narrative":"This column contains US state abbreviations (and possibly territories or non-standard codes given 118 unique values vs. the expected 50\u201360), making it a geographic categorical feature. 
The most critical signal is a 58.5% null rate, meaning over half the 354,770 rows have no state recorded \u2014 a severe data quality issue. The top value is 'TX' at 8.6% of non-null rows, with CA and FL following; the 118-cardinality (more than double the 50 US states) suggests the presence of territories, foreign country codes, or dirty values worth auditing.","role":"feature","scope":"column","target":"state","treatment":"Audit the 118 unique values to identify non-US-state codes, impute or flag nulls (58.5% missing), then encode as categorical for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["column","kind","null_rate","top_rate","top_value","top_values","n","entropy_ratio","cardinality"],"model":"anthropic:default","narrative":"This column represents a count of fatalities per incident, stored as a categorical type despite being inherently numeric. The null rate is severe at 75.59%, meaning only ~86,600 of 354,770 rows have a value. Among non-null rows, 92.86% record zero fatalities, with a long tail reaching at least 10; the low entropy ratio (0.088) confirms extreme concentration at '0'.","role":"feature","scope":"column","target":"fatalities","treatment":"Cast to integer, investigate and impute or exclude the 75.59% nulls, then treat as a heavily zero-inflated count variable (consider zero-inflated Poisson or log1p transform for regression)."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","cardinality","entropy","entropy_ratio","n","top_values"],"model":"anthropic:default","narrative":"This column records injury counts per incident, stored as a categorical type despite being numeric in nature \u2014 values are integers ('0', '1', '2', \u2026) with a cardinality of 233 distinct values. The null rate is severely high at 75.59%, meaning only ~86,600 of 354,770 rows have a recorded value, which is flagged as an alert. 
Among non-null rows, 85.4% report zero injuries, producing a heavily right-skewed distribution with low entropy (1.23, entropy ratio 0.157). The presence of 233 distinct values suggests some entries may encode ranges, text annotations, or data-entry anomalies beyond simple integers.","role":"feature","scope":"column","target":"injuries","treatment":"Cast to numeric, investigate nulls (MCAR vs. structural zero), treat missing as unknown rather than zero, then consider zero-inflated or count-based model treatment."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","n","n_unique","cardinality","entropy_ratio","top_values"],"model":"anthropic:default","narrative":"This column represents a magnitude scale (likely seismic, stellar, or similar physical measurement) stored as a categorical type despite being fundamentally numeric \u2014 values include integers (0, 1, 2, 3, 4) and decimals (4.5, 4.6, 4.7, 1.75). The null rate of 76.7% is alarming and triggered an alert, meaning over three-quarters of the 354,770 rows carry no value. An additional surprise is the presence of '-9', which appears 1,278 times and is almost certainly a sentinel/missing-value code rather than a true measurement. 
The top value '0' accounts for 44.4% of non-null observations, and an entropy_ratio of 0.31 confirms a heavily skewed, low-diversity distribution despite 294 unique string representations.","role":"feature","scope":"column","target":"magnitude","treatment":"Cast to float after replacing '-9' with NaN, investigate the 76.7% null rate for systematic missingness, then consider log-transform or binning before modelling."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","top_value","top_rate","n_unique","entropy_ratio","top_values","kind"],"model":"anthropic:default","narrative":"This column represents the width of some geographic or physical feature measured in yards, stored as a categorical type despite being numeric in nature. Nearly 80% of values are null (null_rate = 0.7976), making missingness the dominant signal. Among the 71,493 non-null records, values are round numbers (10, 50, 100, 30, 20, 200\u2026) suggesting manual or estimated entries rather than precise measurements. The top value '10' accounts for 20.2% of non-null rows, and with 437 unique values and an entropy ratio of 0.51, the distribution is moderately concentrated.","role":"feature","scope":"column","target":"width_yards","treatment":"Cast to numeric, investigate whether nulls are structurally missing (feature absent) or simply unrecorded before imputing or dropping; log-transform or bin for modelling given round-number clustering."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","top_values","cardinality"],"model":"anthropic:default","narrative":"This column captures the reported shape of UFO/unidentified aerial phenomena sightings, with 28 distinct categories such as 'light', 'triangle', 'circle', and 'fireball'. The most striking issue is an 82.91% null rate across 354,770 rows, meaning only ~60,600 records have a shape value at all. 
Among non-null records, 'light' dominates at 21.27%, and the presence of catch-all categories like 'unknown' (4,359) and 'other' (4,209) further dilutes the informativeness of the non-missing data.","role":"feature","scope":"column","target":"shape","treatment":"Impute or flag nulls as a separate 'not_reported' category before encoding; consider consolidating 'unknown' and 'other' with nulls given ambiguity."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","cardinality","entropy_ratio","top_values"],"model":"anthropic:default","narrative":"This column contains meteorite classification codes (e.g., 'L6', 'H5', 'CM2'), representing standard petrologic-type designations for chondrite and other meteorite classes. The most striking feature is an extremely high null rate of 90.93%, meaning only roughly 32,000 of 354,770 rows carry a classification. Among classified records the distribution is moderately concentrated \u2014 'L6' alone accounts for 20.3% of non-null values \u2014 with 395 distinct classes and an entropy ratio of ~0.51, indicating moderate spread across the taxonomy.","role":"label","scope":"column","target":"meteorite_class","treatment":"Impute nulls with an explicit 'Unknown' category or exclude from supervised models; encode via target or ordinal encoding given 395 classes and severe class imbalance."},{"confidence":"low","critiques":[],"evidence_keys":["column","alerts","n","null_rate","n_unique","stats","kind"],"model":"anthropic:default","narrative":"This column contains abandoned-reason codes or labels \u2014 likely a categorical field recording why a record, transaction, or session was abandoned. The profiler emitted a 'skipped' alert with no stats or uniqueness counts, meaning the column's type could not be resolved and no frequency analysis was performed. 
With 354,770 non-null rows and a null rate of exactly 0.0, the field is fully populated, but its true cardinality, distribution, and value content are entirely unknown from this evidence.","role":"label","scope":"column","target":"abandoned_reason","treatment":"Re-profile with explicit string/categorical typing to recover value counts and cardinality before any downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["column","n","null_rate","alerts","stats"],"model":"anthropic:default","narrative":"This column records elevation in metres for 354,770 rows with no nulls. The profiler emitted a 'skipped' alert and returned no computed statistics, so distribution shape, range, skew, and uniqueness are entirely unknown from this evidence. The name strongly implies a continuous numeric geographic feature, but no further characterisation can be made without re-running profiling.","role":"feature","scope":"column","target":"elevation_m","treatment":"Re-profile to obtain range, skew, and outlier metrics; then consider log-transform or clipping if heavily right-skewed before use in modelling."},{"confidence":"low","critiques":[],"evidence_keys":["column","n","null_rate","alerts"],"model":"anthropic:default","narrative":"The column 'mass_g' likely represents mass measurements in grams across 354,770 records, with zero nulls indicating complete data coverage. 
No distributional statistics are available \u2014 the profiler skipped this column \u2014 so skew, range, outliers, and uniqueness cannot be assessed from the evidence provided.","role":"feature","scope":"column","target":"mass_g","treatment":"Re-profile to obtain distribution stats; then check for skew and consider log-transform before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","iqr","skew","n_outliers","outlier_rate","null_rate","n_unique"],"model":"anthropic:default","narrative":"This column contains geographic longitude values for 354,770 records, spanning the full valid range from -179.28\u00b0 to 180\u00b0. The distribution is moderately right-skewed (skew = 0.755) with a mean of -31.75\u00b0 and median of -42.66\u00b0, indicating a concentration of records in the Western Hemisphere (Americas/Atlantic). The IQR of 104.81\u00b0 is extremely wide, suggesting genuinely global coverage rather than a region-specific dataset, and only 827 values (0.23%) are flagged as outliers.","role":"feature","scope":"column","target":"longitude","treatment":"Pair with latitude for geospatial modelling; consider coordinate binning or haversine-based features rather than treating as a raw numeric."},{"confidence":"high","critiques":[],"evidence_keys":["cardinality","n_unique","null_rate","top_value","top_rate","entropy","entropy_ratio","top_values"],"model":"anthropic:default","narrative":"This column is a data-source/event-type label drawn from 14 distinct categories across 354,770 rows with zero nulls. The categories span scientific datasets (NOAA tornadoes, NASA meteorites, OSM features) and paranormal/anomalous phenomena (UFO sightings, Bigfoot, haunted places, megalithic portal), suggesting this is a multi-source 'strange phenomena' aggregation dataset. 
Distribution is moderately uneven \u2014 the top value 'noaa_tornadoes' holds 20.2% of rows (71,813), while 'bigfoot_sightings' has only 3,797 \u2014 but entropy of 2.99 against a ratio of 0.78 indicates reasonable spread across classes. No nulls and clean cardinality make this an immediately usable stratification variable.","role":"label","scope":"column","target":"category","treatment":"Use as a stratification or grouping key; one-hot encode or target-encode for modelling."}],"providers":["anthropic:default"],"total_usage":{"completion_tokens":7442,"prompt_tokens":33851,"total_tokens":41293}},"language_counts":{"als":1,"ar":15,"az":6,"ba":13,"be":23,"ca":55,"ceb":5,"cs":14,"cy":8,"da":38,"de":258,"el":8,"en":8310,"es":158,"eu":29,"fi":7,"fr":285,"hr":5,"hu":24,"id":18,"it":240,"ja":7,"ko":1,"la":1,"nl":30,"no":13,"pl":30,"pt":36,"ro":9,"ru":111,"sk":10,"sl":2,"sv":17,"tr":7,"tt":1,"uk":13},"meta":{"generated_at":"2026-06-22T01:08:51+00:00","mode":"full","row_count":354770,"sampled_rows":354770,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/strange_places_v5.2.json"},"notes":[],"saturn_version":"0.2.0","schema":{"abandoned_reason":"unknown","abandoned_year":"categorical","access":"categorical","cargo":"categorical","category":"categorical","cave_depth_m":"categorical","cave_length_m":"categorical","cave_ref":"text","cave_type":"categorical","city":"text","country":"categorical","damage_property":"text","date":"text","depth_km":"numeric","description":"text","duration_seconds":"numeric","earthquake_type":"categorical","elevation_m":"unknown","energy_joules":"categorical","event_type":"categorical","fall_type":"categorical","fatalities":"categorical","former_population":"categorical","heritage":"categorical","injuries":"categorical","last_eruption":"categorical","latitude":"numeric","length_miles":"text","longitude":"numeric","magnitude":"categorical","mass_g":"unknown","meteorite_class":"categorical","name":"text","osm_id":"numeric","osm_type
":"categorical","peak_brightness_altitude_km":"categorical","place":"text","place_type":"categorical","shape":"categorical","source":"categorical","state":"categorical","status":"categorical","temperature":"categorical","type":"categorical","velocity_km_s":"categorical","vessel_type":"categorical","volcano_type":"categorical","width_yards":"categorical"}}
