{"columns":[{"alerts":[{"code":"near_unique","level":"info","message":"98.7% of rows are unique strings"}],"column":"name","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[170,475,487,304,3551,425,71,34,16,12,10,5,3,0,1,1,1,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[2.0,5.775,9.55,13.325,17.1,20.875,24.65,28.425,32.2,35.975,39.75,43.525,47.3,51.074999999999996,54.85,58.625,62.4,66.175,69.95,73.725,77.5,81.27499999999999,85.05,88.825,92.6,96.375,100.14999999999999,103.925,107.7,111.475,115.25,119.02499999999999,122.8,126.575,130.35,134.125,137.9,141.67499999999998,145.45,149.225,153.0]},"near_unique":true,"sample":["Nordland","Probable USMC Landing Craft","Ship Wreck","Shipwreck 1183795103","Shipwreck 6653835473","Port Werburgh Concrete Barge","Shipwreck 7075573076","Shipwreck 1387382577","\u0416\u0435\u043b\u0435\u0437\u043e\u0431\u0435\u0442\u043e\u043d\u043d\u043e\u0435 \u0441\u0443\u0434\u043d\u043e \u0442\u0438\u043f\u0430 \"\u0412\u0438\u043a\u0438\u043d\u0433\"","U-869 (Wrack)","P.S. Agnes","Shipwreck 9598789175","Shipwreck 3145392410","Mohegan","Relitto mercantile \"San Francesco di Catone\"","Shipwreck 2818717153","Shipwreck 1156299208","Shipwreck 1251357233","Shipwreck 1454027318","Shipwreck 6516222059","Shipwreck 3145392563","City of Grand Rapids (steamer)","Shipwreck 2351011959","Wrak Botter","Shipwreck 385126926","Shipwreck 978789211","Shipwreck 10538093267","Shipwreck 2901729585","Shipwreck 803699391","Shipwreck 1392845451","SS Goolgwai","USS Amesbury (bow)","Shipwreck 49457720","Shipwreck 6122110223","Zenobia Shipwreck","Queen","Shipwreck 1389423819","Shipwreck 9236618763","Shipwreck 7290147686","Shipwreck 9528248000","Scheepswrak van Wierum","Shipwreck 1388382841","Shipwreck 3145392397","Shipwreck 1388382837","Shipwreck 1392258615","Shipwreck 1409348440","Ingar\u00f6 102","Shipwreck 6122110229","Panagia ship wreck","Shipwreck 1385762404"],"top_values":[],"top_words":[["shipwreck",3706],["wreck",96],["ss",90],["(wrack)",57],["of",54],["uss",42],["the",39],["barge",36],["maru",33],["hms",30],["de",24],["mv",23],["le",19],["ii",18],["wrack",18],["concrete",18],["boat",17],["s.s.",16],["(wreck)",16],["city",16],["lcm",16],["port",15],["ship",15],["relitto",14],["werburgh",14]],"vocab_skipped":null,"word_histogram":{"counts":[576,4399,0,351,0,172,38,0,19,0,8,1,0,1,0,1,1,0,1,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.6,2.2,2.8,3.4,4.0,4.6,5.2,5.8,6.3999999999999995,7.0,7.6,8.2,8.8,9.4,10.0,10.6,11.2,11.799999999999999,12.4,13.0,13.6,14.2,14.799999999999999,15.399999999999999,16.0,16.6,17.2,17.8,18.4,19.0]}},"kind":"text","n":5569,"n_null":0,"n_unique":5497,"null_rate":0.0,"stats":{"allcaps_rate":0.017238283354282635,"boilerplate_rate":0.0,"duplicate_rate":0.012928712515711977,"emoji_rate":0.0,"len_max":153,"len_mean":17.812713233973785,"len_median":20.0,"len_min":2,"len_p95":21.0,"n_duplicates":72,"n_empty":0,"one_word_rate":0.10342970012569581,"readability_flesch_mean":71.32877500000001,"url_rate":0.0,"vocab_size":6255,"word_mean":2.072903573352487,"word_median":2.0}},{"alerts":[],"column":"lat","extras":{"histogram":{"counts":[1,0,0,1,1,20,39,41,50,107,235,110,55,117,67,28,30,72,73,67,39,180,104,80,106,84,74,140,470,734,578,466,668,332,185,77,98,34,5,1],"edges":[-77.4249898,-73.43508664500001,-69.44518349,-65.455280335,-61.465377180000004,-57.475474025000004,-53.485570870000004,-49.495667715,-45.50576456,-41.515861405,-37.52595825,-33.536055095,-29.54615194,-25.556248785,-21.56634563,-17.576442475,-13.58653932,-9.596636164999993,-5.606733009999999,-1.616829855000006,2.3730733000000015,6.362976455000009,10.352879610000002,14.342782764999995,18.332685920000003,22.32258907500001,26.312492230000004,30.302395384999997,34.292298540000004,38.28220169500001,42.272104850000005,46.262008005,50.251911160000006,54.24181431500001,58.23171747000002,62.221620625,66.21152378000001,70.20142693500001,74.19133009,78.181233245,82.1711364]},"sample":[48.2808606,12.3201688,54.433522,54.267833,-34.8104698,52.5939644,12.171676,48.417403,12.0260699,24.45,25.06667,41.8228833,41.945,44.9113,44.1388028,43.9316667,44.3127,45.2678,51.4499857,51.487933,50.7425,50.6427777,4.099112,55.7688333,54.187952,43.006409,-51.6897236,48.166123,-35.2924604,-41.3768771,-36.7663206,12.6227502,23.8292123,-43.5801068,54.565315,54.5620144,54.6345175,54.6089903,54.5800162,54.5797851,54.5857931,54.5520572,47.3687095,-33.1068353,21.587664,30.2312064,54.323864,-33.6269093,57.375242,-50.508895,44.2639435,51.7227267,-22.8367789,-22.961575,-23.1516852,-29.5724137,-17.6953423,-0.4514926,-0.4918309,32.3636114,-1.4144565,-3.7021756,-3.7111638,-4.6999956,-4.8356891,-9.6745726,-16.8867305,31.2987869,-25.4913616,59.8561111,-30.5636747,-31.2961502,-33.3448493,-21.697704,48.0643068,47.5145026,54.1689632,6.3975029,6.4211472,6.4224358,-22.8832447,-22.871332,-23.9940826,48.7057607,43.5266013,59.4844392,-32.0136111,33.9805038,34.0072312,-32.9093766,-32.9244202,-34.2494161,-34.2505403,-34.2510221,-34.2462498,-34.5578444,-34.1196992,-30.8024359,-29.3104145,-12.9093796,-12.119809,-4.4213705,-5.3781067,46.72754,36.9139568,37.033119,37.8431693,37.9084072,38.0261556,38.0755347,38.1265945,38.1497279,38.2175893,38.2335104,38.2835899,38.6686127,38.6764687,40.0175588,40.1403128,40.1745781,40.3607607,40.5175102,40.6832415,40.6845509,40.7565471,40.7923536,40.8086074,41.2256808,41.247008,41.4159767,41.8610446,42.1511538,42.1816658,42.2307299,43.074609,43.1091799,43.1537507,43.2309616,43.2623675,43.474896,43.4785951,43.6750902,43.7031296,43.7860428,43.8090618,43.8208925,43.950694,44.1106997,44.225916,44.229759,44.2662849,44.3172591,44.3229432,44.3753504,44.392289,45.3641334,45.4690863,-31.9193204,18.7920584,21.5147534,46.983458,47.0826803,46.3004177,65.125126,44.6961192,54.2892167,54.45595,35.9643127,36.016902,19.9606915,59.2938444,-36.7232604,46.5294801,-19.1541883,44.2172222,-5.3358275,47.9657675,56.1668079,22.4974291,49.0249421,-32.0027389,59.3113971,44.6239281,51.0781942,51.0592707,60.6307667,46.068889,15.7213052,54.1652078,69.1923249,30.5254206,30.5268785,30.5270634,30.5273268,30.5283872,30.5284612,68.0517272,63.916667,55.6,57.35,32.6742831,38.0978298,60.2113594,-25.068671,41.4215648,56.5201927,45.2675776,45.2981468,50.3799142,50.3579127,50.355013,17.7347284,35.5088968,-21.9106537,37.8072514,30.3833336,16.7447521,59.7930923,60.0293451,-43.6287152,57.7827336,46.756219,-6.164787,57.6529185,38.9814838,54.1623193,10.4739433,39.091627,10.4851966,42.6933591,-51.8698012,50.2039422,59.4480702,59.5032072,-36.7686088,-36.7701366,72.794786,-32.4691348,43.7644181,10.3063374,10.3055978,37.5151789,52.5868573,49.4492839,29.5145068,47.8677379,50.9141809,11.2612893,36.7257233,14.7742361,50.5488378,-21.096,-41.3911035,-41.3530001,-41.6721667,-38.0710723,-43.3500002,-43.4648772,-40.5300897,-35.7339152,-29.9408804,-38.5695891,13.7296327,40.68,40.468,50.9056869,12.1219794,5.9601269,38.3439432,-32.1005389,35.4474874,-33.1503701,-22.1826215,-22.1833629,36.8849241,38.1695329,68.3900962,-32.0955562,-36.4044642,46.8310166,25.4447988,51.6457603,-21.8899426,-51.6941508,-34.3078694,22.5058152,0.1672464,46.3165388,10.2944077,46.8943008,40.680695,41.5416667,54.4900862,36.9230624,25.3718924,39.092562,55.3838483,40.572291,49.0475821,54.6122829,51.4998165,47.6098666,37.7437477,52.4734323,38.4341748,9.6579527,32.8665373,55.6982073,53.4671095,-34.0263688,42.2366126,30.2290232,9.35183,8.74088,55.0637502,39.7556217,37.9477273,8.84838,8.7488,8.74028,8.73013,32.3616925,8.77823,8.84538,8.75166,8.76181,8.77528,46.1872623,53.8336342,12.4438643,36.3973064,-27.4559456,9.8252621,40.6428163,51.7309054,11.5934127,60.8823504,29.2254402,47.5145458,11.2524209,20.8879198,21.3612805,51.5352539,35.2827393,40.5361122,40.5365508,28.2126048,41.9120855,48.5827269,48.8725004,-53.2197192,-34.2714685,42.1694461,69.647167,54.0968516,8.2816262,51.6955885,17.3576762,55.0527845,13.2654535,-16.5496003,44.5293863,39.0812595,-49.5522109,-12.1890215,51.2824355,-41.5108925,54.8986432,51.4158823,37.6996098,-40.7999642,52.3687912,35.048849,50.3954159,52.9592438,-27.1618672,46.9996007,-51.7217149,44.8955067,34.4330505,46.9346178,39.2081788,39.208224,47.4018635,37.7850917,37.7860475,37.7853518,40.5571481,40.5578732,60.3955432,60.3894062,24.7776374,42.9731323,-46.570205,-46.5759973,-45.8021119,-35.3078266,-33.1503887,47.7728867,47.7741058,47.7750667,47.7740864,47.7738556,44.9158953,51.8867033,5.9171233,64.5783195,-0.6242843,68.0670701,71.9822853,69.3804267,50.6847382,53.4195139,36.7226918,65.1573759,41.9110463,41.959668,-8.6686246,18.1161589,50.6530784,16.4004168,13.4624082,39.4595628,40.5581378,69.3904091,69.3909936,69.4167341,41.8149143,-27.2619712,43.5479967,-33.8148018,-32.9137386,48.0906926,58.1529312,17.7497023,53.8714681,53.9239249,53.8312063,-36.8307548,-4.9113773,41.7347546,38.0779495,38.0784813,38.0771143,38.0336806,38.0555781,38.0554537,43.3369665,40.6449441,40.6437392,40.6444104,40.6445678,40.6445649,40.6444765,40.6445642,40.6447,40.6450144,40.6439478,40.6439801,40.6438206,40.6435843,40.6431067,40.6423872,40.6418583,40.6384639,40.6386191,40.6395623,40.6383857,40.6381941,40.6382464,38.6701129,43.5231677,48.6010082,48.6011296,48.5992672,51.4061905,51.406252,51.3809234,51.3804428,51.3768472,51.4109847,51.4194477,51.4194968,51.4104357,51.4052253,51.4101388,51.4127286,51.412835,54.6221654,45.9058524,-20.6518445,51.3870331,59.7012397,-13.8248507,51.735551,51.7734921,51.7336275,51.7333419,32.3535843,24.5845259]},"kind":"numeric","n":5569,"n_null":0,"n_unique":5561,"null_rate":0.0,"stats":{"iqr":37.821963000000004,"kurtosis":0.08299029751430265,"max":82.1711364,"mean":28.41433878021189,"median":40.6434862,"min":-77.4249898,"n_outliers":112,"outlier_rate":0.02011133057999641,"q1":12.5355236,"q3":50.3574866,"skew":-1.1358408577236159,"std":31.35537549818393,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"9.7% rows beyond 1.5 IQR"}],"column":"lon","extras":{"histogram":{"counts":[54,17,7,5,4,15,266,15,3,39,161,520,163,211,146,157,39,25,98,586,539,923,302,239,86,100,61,8,31,7,7,23,34,44,48,44,109,69,163,201],"edges":[-179.2833333,-170.315068185,-161.34680307000002,-152.378537955,-143.41027284,-134.442007725,-125.47374261000002,-116.50547749500001,-107.53721238000001,-98.56894726500002,-89.60068215000001,-80.63241703500002,-71.66415192000002,-62.695886805000015,-53.72762169000002,-44.75935657500003,-35.79109146000002,-26.82282634500001,-17.85456123000003,-8.886296115000022,0.08196899999998664,9.050234114999967,18.018499229999975,26.986764344999983,35.95502945999996,44.92329457499997,53.89155968999998,62.85982480499999,71.82808991999997,80.79635503499995,89.76462014999996,98.73288526499996,107.70115037999997,116.66941549499998,125.63768060999999,134.605945725,143.57421083999995,152.54247595499996,161.51074106999997,170.47900618499997,179.4472713]},"sample":[-4.5945667,122.5033517,11.322611,13.945067,138.5416398,7.2840668,-68.2893863,-123.402219,-68.2515176,-81.7333,-80.31084,-82.5361639,-82.855,-80.1568611,-76.5845194,-76.7366667,-73.3081826,-81.7149972,-9.4614034,-9.493483,-0.0138888,-0.1286111,73.400468,10.698333,21.655981,6.0841597,-57.8790537,-16.2,173.1613657,174.8683817,174.8740612,-8.0257385,35.808667,-142.720271,-0.5961416,-0.6061899,-0.8890944,-0.6899242,-0.5387463,-0.5387416,-0.7841805,-0.6253391,-70.4042464,138.0282252,-81.5849518,-87.9308259,12.361615,151.1647989,-5.5268994,166.171997,15.9381355,157.9747719,-43.1051592,-43.0597584,-43.7196315,-49.4962044,-38.9888715,-47.8811026,-47.0771732,-64.9135213,-48.5037055,-38.4878508,-38.5274812,-36.7213946,-37.1141079,-35.7124763,-38.917089,32.3393576,-48.290327,10.5944444,-50.3747896,-50.8996682,-52.5986873,-57.8922818,-88.3233462,-89.1979561,12.1399814,3.3702583,3.5107693,3.5547122,-43.1768552,-43.1309295,-46.3006046,-125.0070774,16.4211527,24.7116135,115.5414806,-120.2332333,-119.4085395,-60.6746923,-60.6598227,-58.7141653,-58.7093078,-58.707226,-58.7271001,-57.6151478,-58.3327919,-51.3044284,-49.693645,-38.4934625,-37.6636585,-37.7576828,-35.2543068,-2.41823,15.1816243,14.2313643,15.6539967,15.9571653,13.7659284,14.1872447,13.5222821,12.60438,15.3198588,15.6121831,15.7671291,13.7132774,15.3900164,16.6732156,17.8080228,17.9061066,14.9799334,18.2069825,18.0156167,17.9714494,14.0973194,17.6225681,17.6084399,16.7282994,9.4654888,16.1918801,12.1781117,11.7235733,11.5691266,14.9208124,10.3134639,10.4389869,13.913941,13.7838309,14.0774394,13.7340231,10.0518255,13.3062336,10.2767387,10.2167678,7.909425,7.8898719,9.9013834,8.397578,8.4221895,9.4734189,9.3330893,9.1269573,9.2268334,8.9911169,8.8883033,12.4454944,12.5836292,152.4557841,53.2588635,-87.360859,-2.4912558,-2.4544963,59.4801937,25.0270718,14.3699073,14.0405667,13.6831833,14.3337455,14.2862962,-75.993528,18.4215611,-73.0938864,36.1555547,146.8681711,8.4680556,72.2672923,-4.1020967,-5.5552021,-78.8183807,140.2606243,115.5573389,18.4553092,-63.5393365,2.5006799,2.423578,4.8469896,-5.784444,39.9477696,23.9070226,33.375982,47.8360364,47.8388473,47.8388473,47.8433937,47.842412,47.8421733,-99.2259521,0.4,-1.4,-1.65,-117.1731815,-122.850729,19.3192955,-130.095087,-70.9432337,-5.9531263,59.3207001,59.3351036,-4.1936375,-4.1058838,-4.1117986,105.1520871,23.5668725,165.7552256,-122.42986,-179.2833333,-22.8932595,21.0158714,20.9029442,172.6834605,45.6212237,60.7134968,155.6336648,-3.6219478,23.017684,15.5517206,-67.9873289,-119.9542736,-67.8246771,17.7010046,-58.250486,-3.7238868,24.7893408,24.6213562,174.8777462,174.8797399,-56.1082509,142.3859966,-69.781383,-109.2003634,-109.200352,23.3974813,21.448653,-123.330204,34.9270007,-3.3525728,-1.4760718,-15.7538024,26.919711,120.249947,-3.237351,-175.1904,174.7899563,174.7800001,174.8221667,174.7568129,172.9999321,173.199447,173.1640062,174.6918158,-71.3344662,-58.6488427,-60.9721116,23.735,22.8285,-1.3842804,-68.943725,80.7194106,15.2201867,-60.6470599,-120.9189766,18.0842513,166.4162354,166.4173472,27.1567574,-76.0901839,14.4122495,115.7586465,174.1083329,138.4423497,-80.1192183,-4.2483315,153.6607477,-57.8023968,18.4018744,91.698488,117.467518,-1.0478693,-109.2223621,-56.3340271,-8.6326079,-70.8777778,-0.5993292,3.8905843,-170.568415,23.0669474,-5.7932617,8.300181,3.0364416,18.5123114,30.5864843,-2.7680178,-25.626209,1.7167583,-74.7644854,-82.7556887,139.1997306,37.6744257,6.2667802,123.2418396,12.5093287,122.7586335,167.44186,167.71691,-1.449112,-74.0998869,23.5658986,167.74083,167.68783,167.7229,167.72235,-64.9141105,167.72611,167.73961,167.68396,167.66831,167.71188,-123.0979904,-79.0062282,-61.4972025,-6.2043699,-58.8198536,169.3055589,-74.1679433,0.6903247,92.2123352,30.6370098,50.2983336,-89.1973714,124.9911439,-17.0570711,-17.026327,46.0895553,-3.1227886,-74.2471186,-74.2471238,-177.3704698,-73.987005,-2.0016602,2.7730466,-70.9395709,-58.8350763,130.2668871,18.8075946,81.4633855,-78.8457912,-8.5496313,-62.8499406,-162.3294806,-88.5482634,11.6710448,-1.2575901,-84.8487255,69.8213569,44.2877404,30.2205953,-72.9983393,-1.4605654,30.093966,24.2847568,-62.9972626,5.1529539,-78.8581542,-125.9587111,158.7062701,153.3678616,-85.1092537,-61.3000574,-86.07366,40.9856629,31.9593613,-76.5760841,-76.575641,-122.4652689,-122.2500199,-122.2519726,-122.2540524,-74.2172798,-74.2152789,11.2341548,11.2515554,141.2919251,17.22665,168.3171496,168.3096007,170.6274308,174.1257689,18.0842658,-3.2988491,-3.2960196,-3.2960999,-3.2950689,-3.2935005,10.6152552,-8.3233761,10.1589897,40.4749277,73.1016144,39.4967836,102.4627272,86.2141245,156.1831212,-9.8774483,5.5567245,37.1119161,-73.9963203,-73.9603969,13.4152883,-62.9811334,156.1244971,39.1920297,144.6353577,-75.5240788,-74.2145975,33.1582213,33.1558918,33.1371015,-71.3928049,153.1071192,-79.5756043,151.2244422,151.7972777,-4.3339051,11.420737,-64.6967759,-166.5440315,-166.508369,-166.6116551,174.8903318,115.6540767,-49.9431156,-121.9564621,-122.022875,-122.0240199,-122.1252954,-121.8391351,-121.8391745,-124.1945364,-74.173693,-74.1693019,-74.1645331,-74.1641274,-74.1634312,-74.1619939,-74.1620382,-74.1621938,-74.1616112,-74.162112,-74.1616559,-74.1613398,-74.1628886,-74.1577191,-74.1575119,-74.1573669,-74.1532635,-74.1545243,-74.1543901,-74.1494389,-74.1500231,-74.1497843,-9.0087634,-1.4967039,-2.0051021,-2.0048979,-2.0077475,0.5956627,0.5800705,0.6301674,0.6310261,0.6275529,0.6979969,0.7057842,0.7066458,0.7317046,0.5499232,0.557879,0.5690146,0.571044,13.2265423,-64.6240816,116.4470134,0.5114027,10.596345,-172.0184723,0.6905186,0.898495,0.686484,0.6864409,-64.7105538,-81.8191513]},"kind":"numeric","n":5569,"n_null":0,"n_unique":5568,"null_rate":0.0,"stats":{"iqr":80.728115,"kurtosis":0.2435224882443583,"max":179.4472713,"mean":1.413148562847908,"median":2.033333,"min":-179.2833333,"n_outliers":542,"outlier_rate":0.09732447477105405,"q1":-58.596951,"q3":22.131164,"skew":0.5273027069818278,"std":76.7538304665523,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"35 singleton categories"},{"code":"null_rate","level":"warn","message":"99.3% null"}],"column":"year_sunk","extras":{"singletons":35,"top_values":[["1942",2],["30 June 1890",1],["1854",1],["1971",1],["1937-09-02",1],["1963-02",1],["1643..1663",1],["1982",1],["June 7, 1928",1],["1435",1],["1920-12-16",1],["1490s",1],["~1700",1],["20 April 1943",1],["25 May 1963",1],["1710",1],["1915",1],["1909",1],["1951",1],["1952",1]]},"kind":"categorical","n":5569,"n_null":5532,"n_unique":36,"null_rate":0.9933560782905368,"stats":{"cardinality":36,"entropy":5.155399311574898,"entropy_ratio":0.9971903480488863,"top_rate":0.05405405405405406,"top_value":"1942"}},{"alerts":[{"code":"long_tail","level":"info","message":"17 singleton categories"}],"column":"type","extras":{"singletons":17,"top_values":[["shipwreck",5081],["ship",381],["barge",27],["submarine",18],["aircraft",17],["plane",10],["boat",4],["vehicle",3],["motor_vehicle",3],["schooner",2],["car",2],["sailboat",2],["battleship",2],["steamer",1],["airplane",1],["freightcar",1],["train",1],["paddle steamer",1],["motorbike",1],["helicopter",1]]},"kind":"categorical","n":5569,"n_null":0,"n_unique":30,"null_rate":0.0,"stats":{"cardinality":30,"entropy":0.5649690531607278,"entropy_ratio":0.1151378947935692,"top_rate":0.91237205961573,"top_value":"shipwreck"}},{"alerts":[{"code":"long_tail","level":"info","message":"303 singleton categories"},{"code":"null_rate","level":"warn","message":"94.4% null"}],"column":"wikipedia","extras":{"singletons":303,"top_values":[["en:SS Edmund Fitzgerald",4],["fr:Armorique (navire)",2],["en:Curtiss C-46 Commando",2],["en:USS Amesbury",2],["en:SS America (1939)",1],["ar:\u0633\u0641\u064a\u0646\u0629 \u0632\u064a\u0633\u062a\u0644 \u062c\u0648\u0631\u0645",1],["en:BOS 400",1],["en:New Carissa",1],["en:MV Cita",1],["en:SS Richard Montgomery",1],["en:Kroombit Tops National Park#Crash site",1],["en:Astron (ship)",1],["en:SS Yongala",1],["et:Raketa (laev, 1949)",1],["en:USNS General Hoyt S. Vandenberg (T-AGM-10)",1],["en:USS Oriskany (CV-34)",1],["en:USS Massachusetts (BB-2)",1],["en:Water Witch (schooner)",1],["en:Burlington Bay Horse Ferry",1],["en:Champlain II",1]]},"kind":"categorical","n":5569,"n_null":5256,"n_unique":307,"null_rate":0.9437960136469743,"stats":{"cardinality":307,"entropy":8.245290412427826,"entropy_ratio":0.9979660808479136,"top_rate":0.012779552715654952,"top_value":"en:SS Edmund Fitzgerald"}},{"alerts":[{"code":"long_tail","level":"info","message":"347 singleton categories"},{"code":"null_rate","level":"warn","message":"93.5% null"}],"column":"wikidata","extras":{"singletons":347,"top_values":[["Q1286267",4],["Q959696",2],["Q215692",2],["Q2862787",2],["Q1145708",2],["Q11675753",2],["Q463091",1],["Q32276",1],["Q115709756",1],["Q14213801",1],["Q2877353",1],["Q7006376",1],["Q6719379",1],["Q41771616",1],["Q7394285",1],["Q7420193",1],["Q1359321",1],["Q4811601",1],["Q1424289",1],["Q1618842",1]]},"kind":"categorical","n":5569,"n_null":5208,"n_unique":353,"null_rate":0.935176871969833,"stats":{"cardinality":353,"entropy":8.445993531042296,"entropy_ratio":0.9979286593320096,"top_rate":0.0110803324099723,"top_value":"Q1286267"}},{"alerts":[{"code":"long_tail","level":"info","message":"269 singleton categories"},{"code":"null_rate","level":"warn","message":"93.9% null"}],"column":"description","extras":{"singletons":269,"top_values":[["WWII era concrete fuel barge converted into breakwater",14],["Wrecks",7],["WWII concrete barge sunk as part of jetty, partially covered by jetty and fill",5],["Location is based on divers hand drawn maps. Due to the wreak breaking up and salvage, the wreak is scattered over a large area.",4],["Partially sunken ships",4],["Concrete petrol barge sunk as part of breakwater",4],["Wrecks of Zulu fishing boats",3],["Chaloupe abandonn\u00e9e \u00e0 terre",3],["WWII era concrete fuel barge sunk as part of jetty foundation",3],["Armada Ship",2],["remains of sunken wooden boats",2],["Hundido el 3 de julio de 1898 durante la batalla naval de Santiago de Cuba en la Guerra Hispano-Cubana-Norteamericana.",2],["09/09/2006 : Epave en bois, longue de 20 m\u00e8tres, large de 4 m\u00e8tres et haute de 3 m\u00e8tres.",2],["Steamer",2],["Iron-hulled barque",2],["On shore wreck of a small abandoned wooden ship.",2],["\u00c9pave",2],["Doj\u015bcie do wrak\u00f3w w zasadzie wolne. Jednak mog\u0105 wyst\u0105pi\u0107 sytuacje gdy b\u0119dzie to utrudnione lub niemo\u017cliwe.",2],["Wrecked sealing vessel",2],["Staten Island boat graveyard",2]]},"kind":"categorical","n":5569,"n_null":5227,"n_unique":291,"null_rate":0.9385886155503681,"stats":{"cardinality":291,"entropy":7.982680712710059,"entropy_ratio":0.9752965534932168,"top_rate":0.04093567251461988,"top_value":"WWII era concrete fuel barge converted into breakwater"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"99.8% null"}],"column":"heritage","extras":{"singletons":3,"top_values":[["2",10],["no",1],["yes",1],["1",1]]},"kind":"categorical","n":5569,"n_null":5556,"n_unique":4,"null_rate":0.9976656491291076,"stats":{"cardinality":4,"entropy":1.1451104143815827,"entropy_ratio":0.5725552071907913,"top_rate":0.7692307692307693,"top_value":"2"}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.9% null"}],"column":"access","extras":{"singletons":1,"top_values":[["yes",340],["no",73],["permit",27],["private",27],["unknown",20],["permissive",17],["customers",3],["foot",1]]},"kind":"categorical","n":5569,"n_null":5061,"n_unique":8,"null_rate":0.9087807505835878,"stats":{"cardinality":8,"entropy":1.6491288720023753,"entropy_ratio":0.5497096240007918,"top_rate":0.6692913385826772,"top_value":"yes"}},{"alerts":[{"code":"long_tail","level":"info","message":"120 singleton categories"},{"code":"null_rate","level":"warn","message":"96.3% null"}],"column":"depth","extras":{"singletons":120,"top_values":[["7",6],["30m",4],["16",4],["14",4],["8",4],["10",4],["25m",3],["12.2",3],["15.6",3],["15",3],["4",3],["5",3],["6.1",2],["-0.3",2],["97",2],["11",2],["6.4",2],["42",2],["18",2],["3",2]]},"kind":"categorical","n":5569,"n_null":5361,"n_unique":154,"null_rate":0.962650386065721,"stats":{"cardinality":154,"entropy":7.084867121904036,"entropy_ratio":0.9749656305752077,"top_rate":0.028846153846153848,"top_value":"7"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 98.4% of rows"}],"column":"seamark_type","extras":{"singletons":5,"top_values":[["wreck",5026],["hulk",56],["shoreline_construction",14],["obstruction",7],["harbour",2],["restricted_area",1],["plane",1],["beacon_special_purpose",1],["landmark",1],["no",1]]},"kind":"categorical","n":5569,"n_null":459,"n_unique":10,"null_rate":0.08242054228766385,"stats":{"cardinality":10,"entropy":0.14771497753641039,"entropy_ratio":0.0444666390472907,"top_rate":0.9835616438356164,"top_value":"wreck"}},{"alerts":[],"column":"osm_id","extras":{"histogram":{"counts":[261,442,361,685,726,181,136,46,213,623,44,45,55,29,53,45,27,86,55,174,59,45,39,32,70,50,55,182,56,63,27,35,62,37,67,82,56,105,123,37],"edges":[13059633.0,351124299.7,689188966.4,1027253633.0999999,1365318299.8,1703382966.5,2041447633.1999998,2379512299.9,2717576966.6,3055641633.2999997,3393706300.0,3731770966.7,4069835633.3999996,4407900300.099999,4745964966.8,5084029633.5,5422094300.2,5760158966.9,6098223633.599999,6436288300.3,6774352967.0,7112417633.7,7450482300.4,7788546967.099999,8126611633.799999,8464676300.5,8802740967.199999,9140805633.9,9478870300.6,9816934967.3,10154999634.0,10493064300.699999,10831128967.4,11169193634.1,11507258300.8,11845322967.5,12183387634.199999,12521452300.9,12859516967.6,13197581634.3,13535646301.0]},"sample":[278946664.0,285876338.0,296860179.0,330613715.0,477206052.0,614225073.0,635094207.0,663869274.0,663869397.0,663869444.0,663869445.0,663869463.0,663869464.0,663869487.0,663869502.0,663869508.0,663869523.0,663869539.0,663869559.0,663869562.0,663869593.0,663869596.0,663869943.0,663870667.0,663871171.0,686686503.0,828692526.0,1033930279.0,1036801823.0,1036801921.0,1036801969.0,1044201328.0,1068558027.0,1112841934.0,1156298941.0,1156298960.0,1156298978.0,1156298979.0,1156298993.0,1156299243.0,1156299392.0,1156299431.0,1209334135.0,1280115312.0,1612247647.0,1651680734.0,1816855365.0,1829616408.0,1856290216.0,1866606319.0,1921636298.0,1958145333.0,1971472609.0,1971502194.0,1976150008.0,1983994091.0,1985469079.0,1986434277.0,1986434278.0,1987095906.0,1990608807.0,1998240417.0,1998245427.0,1998246279.0,1998246785.0,2063545285.0,2069828598.0,2076573418.0,2097749374.0,2100341313.0,2118489095.0,2118492565.0,2118509054.0,2124092373.0,2171721457.0,2171804358.0,2202986326.0,2247300112.0,2247300142.0,2247300144.0,2341493539.0,2351011959.0,2351445222.0,2452316961.0,2641130377.0,2675393508.0,2774072522.0,2780229546.0,2780236171.0,2804943012.0,2804943013.0,2806465163.0,2806465167.0,2806465168.0,2806465805.0,2818716897.0,2818717704.0,2901724952.0,2903410562.0,2917544819.0,2918108991.0,2921307111.0,2921310587.0,2937595459.0,3145391433.0,3145391441.0,3145391487.0,3145391494.0,3145391511.0,3145391516.0,3145391629.0,3145391632.0,3145391647.0,3145391649.0,3145391667.0,3145391688.0,3145391689.0,3145391857.0,3145391865.0,3145391869.0,3145391881.0,3145391892.0,3145391909.0,3145391910.0,3145391914.0,3145391917.0,3145391920.0,3145392348.0,3145392354.0,3145392368.0,3145392392.0,3145392409.0,3145392413.0,3145392415.0,3145392455.0,3145392456.0,3145392462.0,3145392464.0,3145392467.0,3145392480.0,3145392481.0,3145392492.0,3145392494.0,3145392502.0,3145392506.0,3145392509.0,3145392521.0,3145392541.0,3145392557.0,3145392558.0,3145392565.0,3145392581.0,3145392583.0,3145392598.0,3145392601.0,3145392613.0,3145392615.0,3259236075.0,3277599852.0,3282509807.0,3505886354.0,3517684772.0,3730868933.0,3740075175.0,3754259627.0,3842202408.0,4115922125.0,4158241012.0,4159831402.0,4288699090.0,4306897693.0,4400524441.0,4407793704.0,4737428511.0,4843147743.0,5194716720.0,5241743235.0,5247799169.0,5468668203.0,5732837822.0,5792018092.0,5849369397.0,5896532312.0,5960721367.0,5960741385.0,6046352459.0,6348076018.0,6373710606.0,6411515859.0,6516222059.0,6516228509.0,6516228515.0,6516228517.0,6516228529.0,6516228535.0,6516228544.0,6516940269.0,6516967674.0,6516967680.0,6516967681.0,6518067885.0,6534579072.0,6537057108.0,6561291060.0,6566512233.0,6611083341.0,6727097513.0,6727106627.0,6735631679.0,6735892071.0,6735892072.0,6760873685.0,6765515060.0,6801427799.0,6816353567.0,6853566394.0,6888399085.0,6898595658.0,6932761706.0,6946537859.0,7061902026.0,7067463585.0,7071671947.0,7079569734.0,7169799136.0,7191787778.0,7217314074.0,7259522813.0,7572843808.0,7644014050.0,7978479319.0,8063221454.0,8150781994.0,8150916775.0,8165913416.0,8165918122.0,8269538920.0,8385748617.0,8406154571.0,8407002982.0,8407002983.0,8412500724.0,8491098870.0,8526894453.0,8577535117.0,8600109482.0,8767262717.0,8841823266.0,8956871627.0,9172205761.0,9180376729.0,9222907371.0,9231686990.0,9231686991.0,9231686999.0,9234532504.0,9236468457.0,9236468459.0,9236801066.0,9236894297.0,9324991714.0,9352814315.0,9385639518.0,9456262934.0,9473834112.0,9482845440.0,9483157443.0,9504129497.0,9534546574.0,9566536422.0,9634679149.0,9664779302.0,9760841768.0,9760841769.0,9786622189.0,9864254502.0,9885211699.0,9939223415.0,10593558285.0,10671590750.0,10683545810.0,10941834163.0,10946879100.0,11025669642.0,11051586533.0,11080357004.0,11247284079.0,11638275098.0,11653327635.0,11818501865.0,11838662526.0,11980577311.0,12043402674.0,12059551182.0,12077684865.0,12095294294.0,12100356677.0,12104977842.0,12136435470.0,12136641599.0,12147375501.0,12155275036.0,12212941611.0,12346514495.0,12394538541.0,12406733026.0,12560660564.0,12643951311.0,12734232035.0,12765452189.0,12794083532.0,12798881320.0,12845238695.0,12845245610.0,12900577329.0,12968541384.0,12973869298.0,12978817093.0,12978817100.0,12981269112.0,12981590916.0,12994775215.0,13041027821.0,13041027823.0,13041027831.0,13042348292.0,13042348296.0,13078433004.0,13143549663.0,13456923901.0,13507802401.0,13510887663.0,13535646301.0,22703043.0,98480581.0,120523928.0,172035281.0,179013381.0,207061421.0,245986620.0,251454856.0,251499932.0,304322264.0,311238820.0,314664253.0,314664254.0,384027964.0,385126930.0,421135689.0,425640312.0,502672949.0,528537917.0,534592956.0,537970750.0,612725450.0,671346243.0,678902578.0,685046544.0,705882204.0,706493548.0,736926283.0,745715403.0,759192765.0,772738733.0,777203069.0,778403829.0,779476862.0,779944491.0,782148445.0,783470678.0,785954872.0,802545579.0,803108830.0,817763094.0,839638668.0,846865410.0,847727579.0,855572475.0,879058566.0,886882038.0,893805514.0,911811355.0,911811356.0,932309121.0,934451205.0,934451213.0,934451223.0,972635323.0,972635326.0,986372037.0,986392661.0,995900860.0,998823689.0,1000657627.0,1000657632.0,1000657635.0,1000690899.0,1014952084.0,1035843191.0,1035843207.0,1035843214.0,1035843220.0,1035843231.0,1045130196.0,1063155190.0,1066433756.0,1075467832.0,1078103255.0,1079348293.0,1080440781.0,1080470592.0,1088932307.0,1164275160.0,1172492655.0,1179955214.0,1181405237.0,1181442371.0,1188945041.0,1213406210.0,1221807094.0,1236406710.0,1245790079.0,1251357231.0,1282083609.0,1282734130.0,1282734136.0,1282734143.0,1304349259.0,1304519127.0,1304570821.0,1311003541.0,1311010579.0,1318890629.0,1319915607.0,1320186215.0,1331259925.0,1331527765.0,1332783516.0,1347741175.0,1359297629.0,1378195703.0,1387113186.0,1387113195.0,1387113202.0,1387382560.0,1387382568.0,1387382569.0,1387614540.0,1387937286.0,1388101935.0,1388101945.0,1388120545.0,1388120566.0,1388302490.0,1388302491.0,1388302493.0,1388302499.0,1388302503.0,1388302505.0,1388302506.0,1388382847.0,1388436247.0,1388580797.0,1388580798.0,1388897593.0,1388897606.0,1388897608.0,1389423811.0,1389423818.0,1389423820.0,1391747353.0,1391875017.0,1391964080.0,1391964082.0,1391964095.0,1391993116.0,1392192971.0,1392258617.0,1392258618.0,1392258625.0,1392258650.0,1392258651.0,1392258653.0,1392258664.0,1392436460.0,1392436474.0,1392845458.0,1408932064.0,1413239543.0,1414931947.0,1426092530.0,1426405463.0,1435737729.0,1451297275.0,1453976990.0,1454274262.0,1454276595.0,1454276600.0,1458391822.0,1459203058.0]},"kind":"numeric","n":5569,"n_null":0,"n_unique":5569,"null_rate":0.0,"stats":{"iqr":5334868954.0,"kurtosis":-0.2044279866769072,"max":13535646301.0,"mean":4031676969.3336325,"median":2348528796.0,"min":13059633.0,"n_outliers":0,"outlier_rate":0.0,"q1":1181359593.0,"q3":6516228547.0,"skew":1.070579639039944,"std":3874691689.936448,"zero_rate":0.0}},{"alerts":[],"column":"osm_type","extras":{"singletons":0,"top_values":[["node",3656],["way",1913]]},"kind":"categorical","n":5569,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.9281367891827335,"entropy_ratio":0.9281367891827335,"top_rate":0.656491291075597,"top_value":"node"}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","seamark_type.top_rate","type.top_rate","lon.min","lon.max","lat.min","lat.max","heritage.null_rate","year_sunk.null_rate","depth.null_rate","wikipedia.null_rate","osm_type.top_rate"],"featured_charts":[{"caption":"Longitude spans the full globe; look for clusters along major shipping lanes and coastlines.","column":"lon","kind":"histogram"},{"caption":"Latitude skews toward the northern hemisphere (median ~40.6\u00b0), reflecting denser mapping there.","column":"lat","kind":"histogram"},{"caption":"Almost everything is tagged 'wreck' (98%); the small slice of hulks and other types is the only variation.","column":"seamark_type","kind":"donut"},{"caption":"Confirms the shipwreck dominance, with a long tail of barges, submarines, and aircraft worth isolating.","column":"type","kind":"bar"},{"caption":"Roughly two-thirds are point nodes and one-third are ways (polygons/lines), which affects how each wreck should be rendered.","column":"osm_type","kind":"donut"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset catalogues 5,569 shipwrecks (and a handful of related features) sourced from OpenStreetMap, with 14 columns covering geography (lat/lon), OSM identifiers, type classifications, and optional metadata like depth, year sunk, and Wikipedia links. The collection is overwhelmingly homogeneous in category: 'wreck' accounts for 98.4% of seamark_type and 'shipwreck' for 91.2% of type, so the interesting variation lives elsewhere. Geographic spread is global \u2014 longitude ranges from -179.28 to 179.45 and latitude from -77.42 to 82.17 \u2014 making the lat/lon distribution the most informative view. Be aware that descriptive fields are largely empty: heritage is 99.8% null, year_sunk 99.3% null, depth 96.3% null, and Wikipedia/Wikidata links are missing for ~94% of records, so any analysis beyond location and basic typing will be working with a small subset.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.len_mean","stats.len_max","stats.word_median","stats.duplicate_rate","stats.n_duplicates","top_words","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds short text labels for individual records, almost certainly vessel or wreck names: 5,497 of 5,569 values are unique, mean length is 17.8 characters with a median of 2 words, and the dominant token \"shipwreck\" appears 3,706 times alongside nautical prefixes like \"ss\", \"uss\", and \"hms\". Despite the near_unique alert, there are 72 duplicates (1.3%) worth inspecting, and the recurring \"shipwreck\"/\"(wrack)\" tokens suggest names follow a templated pattern rather than being free prose.","role":"identifier","scope":"column","target":"name","treatment":"Treat as a name identifier; strip boilerplate tokens like \"shipwreck\" before any text matching, and do not use as a model feature."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","n","n_unique","null_rate","q1","q3"],"model":"anthropic:claude-opus-4-7","narrative":"This is a latitude feature spanning -77.42 to 82.17, covering nearly the full geographic range from Antarctica to the high Arctic. The distribution is left-skewed (skew -1.14) with a median of 40.64 well above the mean of 28.41, suggesting a concentration of points in northern mid-latitudes with a tail of southern hemisphere observations. With 5561 unique values across 5569 rows and no nulls, each record carries a near-distinct coordinate.","role":"feature","scope":"column","target":"lat","treatment":"Pair with the matching longitude column for geospatial features rather than using as a standalone scalar."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","median","mean","skew","iqr","n_unique","n","null_rate","n_outliers","outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds longitude coordinates, with values ranging from -179.28 to 179.45 spanning the full globe and 5568 unique values across 5569 rows. The distribution is mildly right-skewed (0.53) with a median of 2.03 sitting near the prime meridian, and the IQR of 80.73 suggests broad geographic coverage. The flagged 542 outliers (9.7%) likely reflect points in the Pacific tails rather than data errors, given valid lon bounds.","role":"feature","scope":"column","target":"lon","treatment":"Pair with latitude as a geospatial feature; avoid treating outliers as anomalies since extremes are valid longitudes."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the year (or fuller date) a vessel sank, but it's almost entirely empty \u2014 99.34% null with only 36 distinct values across 5569 rows. Date formats are inconsistent: bare years like '1942' and '1435', ISO strings like '1937-09-02', verbose forms like 'June 7, 1928', and even ranges like '1643..1663' coexist. Entropy ratio of 0.997 confirms the few populated values are nearly all unique, with '1942' the only repeat (2 occurrences).","role":"metadata","scope":"column","target":"year_sunk","treatment":"Parse to a normalized year integer and treat as sparse metadata; too null-heavy to use as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical type label for each record, dominated overwhelmingly by maritime wreckage: 'shipwreck' accounts for 5081 of 5569 rows (91.2% top_rate) with 30 distinct values total. Entropy ratio of 0.115 confirms the long_tail alert \u2014 the remaining 29 categories split fewer than 500 rows, with several near-synonyms ('ship'/'boat'/'schooner', 'aircraft'/'plane', 'vehicle'/'motor_vehicle') suggesting inconsistent labelling that could be consolidated.","role":"label","scope":"column","target":"type","treatment":"Collapse synonymous categories and consider binarising as shipwreck-vs-other given the extreme imbalance."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Wikipedia article references prefixed with a language code (e.g., 'en:SS Edmund Fitzgerald', 'fr:Armorique (navire)', 'ar:...'), likely linking each record to an encyclopedia entry about a ship, aircraft, or wreck. It is overwhelmingly sparse \u2014 94.38% null with only 307 distinct values across 5569 rows \u2014 and the distribution is nearly flat (entropy ratio 0.998, top value appears just 4 times, top_rate 1.28%). The presence of multiple language prefixes (en, fr, ar) signals a mixed-language reference field rather than a clean categorical.","role":"metadata","scope":"column","target":"wikipedia","treatment":"Treat as an optional external reference link; drop for modelling or split off the language prefix if needed."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Wikidata Q-identifiers (e.g., Q1286267), linking rows to entities in the Wikidata knowledge graph. It is overwhelmingly sparse \u2014 93.52% null \u2014 and among the 5569 rows only 353 unique values appear, with the most common identifier showing up just 4 times (top_rate 0.011). Entropy ratio of 0.998 confirms the non-null values are nearly all distinct, consistent with a foreign key rather than a categorical feature.","role":"foreign_key","scope":"column","target":"wikidata","treatment":"Left-join on this id to enrich with Wikidata attributes; do not use as a model feature directly."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text descriptive notes about wrecks, barges, and other maritime features, populated for only ~6% of rows (null_rate 0.9386). Among the 342 non-null entries there are 291 distinct strings with entropy_ratio 0.975, so values are nearly all unique short narratives; the modal phrase 'WWII era concrete fuel barge converted into breakwater' appears just 14 times (top_rate 0.041). Mixed languages are present (e.g., French 'Chaloupe abandonn\u00e9e \u00e0 terre' alongside English), confirming this is curator-authored prose rather than a controlled vocabulary.","role":"free_text","scope":"column","target":"description","treatment":"Treat as sparse free text; tokenize/embed for search or keyword extraction rather than using as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.top_rate","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical 'heritage' field that is effectively empty: 99.77% null, with only 13 non-null values across 4 distinct levels. The observed values are inconsistent ('2', '1', 'yes', 'no'), suggesting a coding scheme that was never standardized or fully populated.","role":"metadata","scope":"column","target":"heritage","treatment":"Drop; null_rate of 0.9977 leaves too little signal and the value coding is inconsistent."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is an OpenStreetMap-style 'access' tag indicating who may use a feature, with values like 'yes', 'no', 'permit', 'private', 'permissive', 'customers', and 'foot'. It is overwhelmingly null (90.88%), and among the 508 populated rows 'yes' dominates at 66.93%, leaving the other 7 categories thinly represented. Cardinality is only 8 with entropy ratio 0.55, so signal beyond presence/absence is limited.","role":"metadata","scope":"column","target":"access","treatment":"Collapse rare levels and encode as a low-cardinality categorical, or reduce to a populated/'yes' indicator given the 90.88% null rate."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"A free-text 'depth' field, almost certainly a measurement (likely meters) but stored as strings with mixed formats \u2014 bare numbers like '7', '16', '14' coexist with unit-suffixed values like '30m', '25m', and decimals like '12.2'. It is overwhelmingly missing (null_rate 0.9627) and extremely diffuse among the 208 populated rows: 154 unique values, top value '7' covers only 2.88%, and entropy_ratio 0.975 indicates a near-uniform long tail.","role":"feature","scope":"column","target":"depth","treatment":"Strip unit suffixes and parse to numeric meters; given >96% nulls, treat as low-signal and consider dropping or flagging presence only."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical seamark classification with 10 distinct values, almost entirely dominated by 'wreck' at 98.36% of non-null rows (5026 of 5569). The remaining categories are extreme long-tail (hulk at 56, then single-digit counts down to one), and 8.24% of rows are null. Entropy ratio of 0.044 confirms the column carries almost no discriminative signal.","role":"feature","scope":"column","target":"seamark_type","treatment":"Drop or collapse to a binary 'is_wreck' flag; near-constant."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This is almost certainly the OpenStreetMap object id: every one of the 5569 rows is unique, no nulls, no zeros, and values span 13M to 13.5B which matches OSM's monotonically growing id space. The distribution is right-skewed (skew 1.07) with mean 4.03B well above the median 2.35B, reflecting OSM's accumulation of newer, higher ids over time rather than anything analytically meaningful.","role":"identifier","scope":"column","target":"osm_id","treatment":"Drop from modelling; retain as a join key to OSM source data."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the OpenStreetMap geometry type for each row, taking only two values: \"node\" (3656 rows, 65.6%) and \"way\" (1913 rows). With cardinality 2 and entropy ratio 0.928, the split is fairly balanced but tilted toward nodes, and there are no nulls across all 5569 rows.","role":"feature","scope":"column","target":"osm_type","treatment":"Encode as a binary indicator (node vs way) for modelling."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":4725,"prompt_tokens":16516,"total_tokens":21241}},"language_counts":{},"meta":{"generated_at":"2026-05-01T18:07:22+00:00","mode":"full","row_count":5569,"sampled_rows":5569,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/shipwrecks.json"},"notes":[],"saturn_version":"0.2.0","schema":{"access":"categorical","depth":"categorical","description":"categorical","heritage":"categorical","lat":"numeric","lon":"numeric","name":"text","osm_id":"numeric","osm_type":"categorical","seamark_type":"categorical","type":"categorical","wikidata":"categorical","wikipedia":"categorical","year_sunk":"categorical"}}
