{"columns":[{"alerts":[],"column":"id","extras":{"histogram":{"counts":[592,1123,2360,1819,1497,1907,1345,1415,1806,1977,2439,1595,1710,2212,2764,1741,1236,1268,2153,1135,2343,1932,2060,1970,1451,1229,1689,1952,2902,1840,617,1370,1613,3298,1230,1741,1317,2065,1532,1471],"edges":[12788558.0,350869173.6,688949789.2,1027030404.8000001,1365111020.4,1703191636.0,2041272251.6000001,2379352867.2000003,2717433482.8,3055514098.4,3393594714.0,3731675329.6000004,4069755945.2000003,4407836560.8,4745917176.400001,5083997792.0,5422078407.6,5760159023.200001,6098239638.8,6436320254.400001,6774400870.0,7112481485.6,7450562101.200001,7788642716.8,8126723332.400001,8464803948.000001,8802884563.6,9140965179.2,9479045794.800001,9817126410.400002,10155207026.0,10493287641.6,10831368257.2,11169448872.800001,11507529488.400002,11845610104.0,12183690719.6,12521771335.2,12859851950.800001,13197932566.400002,13536013182.0]},"sample":[305229751.0,331313744.0,338886503.0,370303616.0,453195412.0,552300779.0,552328976.0,589066724.0,621411105.0,639909010.0,655156573.0,656269842.0,693165083.0,698816869.0,809948310.0,829613992.0,859511437.0,861256007.0,861256083.0,861256910.0,861257498.0,861257730.0,861257749.0,1003828286.0,1123061550.0,1140738247.0,1182867659.0,1183673749.0,1282591964.0,1312824946.0,1314308159.0,1332846572.0,1347556476.0,1360646176.0,1360647081.0,1370524120.0,1392918369.0,1410936551.0,1422418870.0,1429320068.0,1435836546.0,1451721335.0,1496373086.0,1507623711.0,1507738867.0,1539494224.0,1558662681.0,1677222231.0,1702926338.0,1702990150.0,1707541572.0,1711061682.0,1713943789.0,1747320101.0,1768209815.0,1780443630.0,1790709781.0,1793459410.0,1834591548.0,1843023086.0,1853451364.0,1893158793.0,1907087333.0,1910811735.0,1943790304.0,1982618594.0,1996919224.0,2007470510.0,2182431722.0,2184163781.0,2194722258.0,2195105277.0,2197188211.0,2207054389.0,2274803878.0,2275567578.0,2315704266.0,2361244870.0,2363156461.0,2369172224.0,2384887596.0,2388250860.0,2477122650.0,2489052207.0,2527207413.0,2530808908.0,2583460113.0,2592496032.0,2601640689.0,2668544168.0,2753415290.0,2757791806.0,2778226587.0,2814115866.0,2821304417.0,2835603003.0,2839648824.0,2839648830.0,2919249072.0,2930279793.0,2992033647.0,3020793773.0,3053200731.0,3067037871.0,3081083163.0,3116685274.0,3131771489.0,3190287569.0,3317129670.0,3367109161.0,3370270563.0,3434168904.0,3437148745.0,3446873488.0,3447339866.0,3470780202.0,3491951640.0,3496957441.0,3523220723.0,3553315271.0,3568840804.0,3615833795.0,3677315074.0,3715970634.0,3730668328.0,3733018203.0,3760627191.0,3788046090.0,3860096843.0,3915067499.0,3915317231.0,3917687382.0,3921399083.0,3960292022.0,3979347717.0,3979828703.0,3990602092.0,4048709313.0,4081927858.0,4088790236.0,4112767546.0,4155521414.0,4163237146.0,4201254773.0,4228360389.0,4280952340.0,4306457116.0,4313458021.0,4318870949.0,4325824307.0,4335554418.0,4340513806.0,4360378585.0,4388876647.0,4401195543.0,4411116124.0,4418503737.0,4461297784.0,4483053223.0,4493647081.0,4512686924.0,4555883668.0,4557096102.0,4557115882.0,4562079271.0,4568767502.0,4568994821.0,4585484492.0,4623628718.0,4656017672.0,4677116391.0,4685625076.0,4741358624.0,4794883662.0,4794883663.0,4829203941.0,4895165337.0,4904016145.0,4908755689.0,4927438169.0,4931383257.0,4935691973.0,4935721263.0,4935721270.0,4940955284.0,4986474847.0,5005046012.0,5052335658.0,5052590061.0,5161127671.0,5261909909.0,5308219930.0,5387441944.0,5436330821.0,5452342924.0,5464792527.0,5486287906.0,5559691970.0,5589760683.0,5606801294.0,5618216426.0,5622395003.0,5664659650.0,5809160989.0,5863716040.0,5873876123.0,5910433649.0,5915727243.0,5926587866.0,5936882715.0,5938205270.0,5940313382.0,5942777642.0,5947980844.0,5981770069.0,6019665851.0,6019879762.0,6041581992.0,6058462685.0,6117058289.0,6127818031.0,6147287815.0,6153125334.0,6175350469.0,6177426724.0,6180747344.0,6289856541.0,6306777111.0,6316326093.0,6347363421.0,6351707242.0,6354840185.0,6357009068.0,6357009373.0,6357009730.0,6357010161.0,6357010234.0,6368677023.0,6368677428.0,6368677436.0,6368677455.0,6422990018.0,6437778333.0,6597383443.0,6695903139.0,6763243943.0,6779291012.0,6815007320.0,6852375901.0,6875759283.0,6887266341.0,6904668726.0,6911907743.0,6937612770.0,6982810720.0,6985148596.0,6985376043.0,7007084676.0,7026776901.0,7027248566.0,7034418303.0,7069855801.0,7070364385.0,7076425883.0,7078683122.0,7078773515.0,7088120582.0,7114093526.0,7266257794.0,7284597353.0,7388517506.0,7391194958.0,7392991118.0,7398960312.0,7400002239.0,7410484467.0,7412091333.0,7453733137.0,7457339870.0,7473834444.0,7474408041.0,7488849573.0,7490553670.0,7498609445.0,7511782365.0,7589853864.0,7606781338.0,7611240024.0,7636235884.0,7636242637.0,7652739156.0,7680674123.0,7738251625.0,7782163151.0,7800364696.0,7807754681.0,7844057747.0,7885338123.0,7960981797.0,7976304474.0,8010399575.0,8026397819.0,8080892317.0,8091189850.0,8101928855.0,8174508417.0,8203854494.0,8320965738.0,8399880225.0,8409656698.0,8415638935.0,8432345382.0,8517719350.0,8560398166.0,8561502113.0,8562989281.0,8569617517.0,8651414882.0,8807314875.0,8830915014.0,8850759480.0,8965425805.0,8975166110.0,8983631709.0,8999648590.0,9002208010.0,9006190336.0,9006434551.0,9024995638.0,9032826068.0,9043618209.0,9046891346.0,9065700586.0,9114091196.0,9130347017.0,9176144233.0,9193270379.0,9203305710.0,9228962180.0,9232513736.0,9254701417.0,9276963132.0,9418254777.0,9433176931.0,9439801323.0,9440297671.0,9458557212.0,9458770516.0,9467879435.0,9502296298.0,9502304138.0,9521491964.0,9523833714.0,9524476817.0,9525050920.0,9525262072.0,9535295818.0,9535295824.0,9536461698.0,9557467044.0,9593486561.0,9655954004.0,9686606962.0,9723859221.0,9741436823.0,9782772114.0,9785375517.0,9792475154.0,9812479477.0,9881424933.0,9881483474.0,9905397224.0,9925123255.0,9974734399.0,9974785165.0,9991100058.0,9995541678.0,10011033076.0,10013359470.0,10088777517.0,10089915627.0,10124866843.0,10140433484.0,10143342794.0,10151865485.0,10177834052.0,10183952923.0,10223682782.0,10289297781.0,10315477111.0,10543642969.0,10553919281.0,10555097411.0,10555208743.0,10599939433.0,10602460747.0,10602460772.0,10612403750.0,10650338650.0,10655495439.0,10676276520.0,10753842577.0,10753847314.0,10754061621.0,10781275838.0,10858753640.0,10913985672.0,10915697933.0,10948652852.0,10962354402.0,10979237146.0,10989007282.0,11007061579.0,11057885734.0,11163966290.0,11164750035.0,11238809518.0,11267335752.0,11276934944.0,11300455154.0,11300503222.0,11300503229.0,11301436869.0,11307577078.0,11307577122.0,11307577504.0,11307577746.0,11307578068.0,11307578399.0,11307578633.0,11307578680.0,11307578838.0,11307578961.0,11307579036.0,11307579130.0,11307579137.0,11307579197.0,11463520067.0,11536435422.0,11653257202.0,11817165773.0,11871661551.0,11872615269.0,11887472521.0,11892229904.0,11898946403.0,11919448669.0,11943711932.0,11958245157.0,12002703535.0,12033604930.0,12048053672.0,12104359099.0,12127898023.0,12288216201.0,12297149699.0,12334471685.0,12405255524.0,12444182240.0,12475299569.0,12509033606.0,12509046869.0,12512128284.0,12598651015.0,12607093791.0,12607817098.0,12620334733.0,12625589781.0,12640412000.0,12641559902.0,12643752243.0,12663407810.0,12752808935.0,12768829533.0,12770501344.0,12825026738.0,12832977119.0,12833220906.0,12877454487.0,12915137764.0,12959145639.0,12970223956.0,13006095930.0,13018679381.0,13028257844.0,13043377591.0,13057614785.0,13067897927.0,13092431619.0,13119465674.0,13121432935.0,13180276901.0,13304672287.0,13323828204.0,13344311512.0,13354338420.0,13363694831.0,13437589993.0,13452729738.0,13456786205.0]},"kind":"numeric","n":69716,"n_null":0,"n_unique":69716,"null_rate":0.0,"stats":{"iqr":6338368332.75,"kurtosis":-1.1770278569443284,"max":13536013182.0,"mean":6841788293.420549,"median":7006519241.0,"min":12788558.0,"n_outliers":0,"outlier_rate":0.0,"q1":3609747458.25,"q3":9948115791.0,"skew":0.019549896755422534,"std":3774305020.5880184,"zero_rate":0.0}},{"alerts":[{"code":"duplicates","level":"warn","message":"35.1% duplicate strings"}],"column":"name","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1601,3457,5854,31600,9877,8424,3274,2614,1175,885,482,175,154,56,45,17,11,3,2,2,4,2,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,4.55,8.1,11.649999999999999,15.2,18.75,22.299999999999997,25.849999999999998,29.4,32.95,36.5,40.05,43.599999999999994,47.15,50.699999999999996,54.25,57.8,61.349999999999994,64.9,68.45,72.0,75.55,79.1,82.64999999999999,86.19999999999999,89.75,93.3,96.85,100.39999999999999,103.94999999999999,107.5,111.05,114.6,118.14999999999999,121.69999999999999,125.25,128.8,132.35,135.9,139.45,143.0]},"near_unique":false,"sample":["Santa Marija Caves","Unnamed Cave","Ipogeo 7\u00b0 via Monti","Grotte des Vers Luisants","Unnamed Cave","Alibi 1. sz. barlang","skaln\u00ed byty","Unnamed Cave","Abisso B52","Cueva de la Torca 3 (corrales del trillo)","Grotta a SW del Zuc Torondo","Shpella e Kusarit","Unnamed Cave","Unnamed Cave","Korina pe\u0107ina","Grotta della Tana","Grotte du Diable","Buca degli antipodi","Duenicka pestera","Grotta di Bercovei","Unnamed Cave","Pozo del Compromiso","The Grotto","Grotte Petzl","Unnamed Cave","Cueva Galiana Alta","Lochbr\u00fccke","Unnamed Cave","Gelsenspalte","Unnamed Cave","L\u00edrhola","Unnamed Cave","Unnamed Cave","Unnamed Cave","Aven des Cabanelles","Unnamed Cave","Unnamed Cave","Banana Ground Sink #1","Chingwe's hole","Unnamed Cave","Priepas\u0165 pod H\u00e1jskou vyhliadkou","Cueva Leza 7","\u0411\u0430\u0445\u0430\u043b\u0432\u0430","\u063a\u0627\u0631 \u0633\u0646\u0651\u0648","Unnamed Cave","Cueva de Santo Adriano","Unnamed Cave","Unnamed Cave","Vatnshellir","Unnamed Cave"],"top_values":[["Unnamed Cave",19527],["\u0413\u0440\u043e\u0442",116],["Cave",58],["Grotte",56],["\u0433\u0440\u043e\u0442",46],["B\u00e4renh\u00f6hle",41],["Cueva",41],["Galleria WW1",34],["Aven",32],["Baume",32],["Grotta",31],["p\u0159evis",31],["Bat Cave",30],["Grotte des F\u00e9es",28],["Stollen",24],["Cueva del Agua",23],["Gouffre",23],["\u7a91\u6d1e",21],["Windloch",20],["Felsenkeller",19]],"top_words":[["cave",6494],["unnamed",5598],["de",2120],["del",1083],["grotta",1049],["la",844],["grotte",737],["di",719],["cueva",713],["cova",596],["buca",485],["du",449],["des",403],["aven",370],["della",291],["jama",192],["avenc",189],["pozzo",179],["dei",169],["sima",164],["delle",146],["trou",124],["2",120],["gouffre",119],["jaskinia",114]],"vocab_skipped":null,"word_histogram":{"counts":[10771,33141,0,13755,6940,0,2753,1375,0,582,237,0,93,44,0,12,7,0,1,2,0,1,1,0,0,0,0,0,0,1],"edges":[1.0,1.6666666666666665,2.333333333333333,3.0,3.6666666666666665,4.333333333333333,5.0,5.666666666666666,6.333333333333333,7.0,7.666666666666666,8.333333333333332,9.0,9.666666666666666,10.333333333333332,11.0,11.666666666666666,12.333333333333332,13.0,13.666666666666666,14.333333333333332,15.0,15.666666666666666,16.333333333333332,17.0,17.666666666666664,18.333333333333332,19.0,19.666666666666664,20.333333333333332,21.0]}},"kind":"text","n":69716,"n_null":0,"n_unique":45229,"null_rate":0.0,"stats":{"allcaps_rate":0.03241723564174651,"boilerplate_rate":0.0,"duplicate_rate":0.3512393137873659,"emoji_rate":1.4343909575994034e-05,"len_max":143,"len_mean":15.52237649893855,"len_median":13.0,"len_min":1,"len_p95":29.0,"n_duplicates":24487,"n_empty":0,"one_word_rate":0.15449825004303172,"readability_flesch_mean":55.50801250000002,"url_rate":0.0,"vocab_size":15219,"word_mean":2.519493373113776,"word_median":2.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-3.16"},{"code":"outliers","level":"warn","message":"12.9% rows beyond 1.5 IQR"}],"column":"lat","extras":{"histogram":{"counts":[4,0,3,0,1,2,13,26,60,127,329,330,225,257,301,204,78,139,314,183,118,358,287,385,1856,937,775,1082,1231,3928,12068,20377,19250,2492,1075,564,267,47,19,4],"edges":[-77.9764944,-74.07253886250001,-70.168583325,-66.2646277875,-62.36067225000001,-58.456716712500004,-54.552761175,-50.648805637500004,-46.7448501,-42.8408945625,-38.936939025,-35.0329834875,-31.129027949999994,-27.225072412499998,-23.321116874999994,-19.417161337499998,-15.513205799999994,-11.609250262499998,-7.7052947249999875,-3.801339187499991,0.10261635000000524,4.006571887500016,7.910527425000012,11.814482962500009,15.718438500000019,19.622394037500015,23.526349575000012,27.430305112500008,31.33426065000002,35.238216187500015,39.14217172500001,43.04612726250002,46.95008280000002,50.854038337500015,54.75799387500001,58.66194941250001,62.56590495000003,66.46986048750003,70.37381602500002,74.27777156250002,78.1817271]},"sample":[27.9295291,40.5370456,15.1068892,29.2042945,44.8715389,50.4846914,54.1785191,51.3783093,57.2061428,40.2549211,57.2048794,50.6625768,50.3957429,44.0433361,50.8566644,49.7782421,44.0522522,43.2836631,43.2679579,43.3529851,43.2800302,43.4159346,43.3205625,44.8702411,-38.913012,47.9588018,12.2231708,48.013249,47.746115,44.3143024,57.4203963,48.852834,43.9416528,45.926493,45.9602596,45.8702272,46.7598016,47.6395281,47.8911631,47.7277071,50.8868035,45.561437,55.9385386,56.1457855,56.1218827,16.0531314,57.7205428,55.164679,38.9968542,38.9956062,43.7456792,44.8762355,45.6125983,50.6845782,45.9188,43.3358025,47.8210147,48.323342,-0.6391406,40.975906,47.615015,-41.2045623,44.3488706,11.4299411,48.374934,28.3582683,44.8999458,47.8373029,43.302231,48.1431852,48.0814412,45.7652513,7.5592645,48.0424947,45.695452,44.3425062,45.6080957,48.4892926,44.2391076,39.7000867,24.2099373,46.4752418,37.7010735,49.5190231,45.842297,54.9982512,45.8682449,41.638916,-3.8796365,28.6239871,48.0061636,47.974825,43.3333727,41.8580131,43.3442122,45.6167134,44.1983193,44.4214616,51.5635965,50.7568077,40.0653185,44.256012,29.2070887,50.2222231,48.6813391,49.8716642,47.7559671,47.315095,44.3068157,47.2542279,47.0105537,40.6531694,48.09366,47.96396,48.084895,47.74546,48.5679786,47.9915519,48.4610392,24.7301669,49.2527042,46.6571882,47.7560049,43.713443,43.3513115,43.9931618,42.806867,50.1625503,35.0044443,47.8366128,43.5385322,66.8199413,32.7540108,42.560143,-33.1117697,38.799046,45.8123402,43.4658982,47.9493986,50.9075168,39.8476991,44.0112674,48.9228682,47.654048,49.61117,48.572757,31.7028826,46.3557299,47.7836681,43.3479718,47.7826486,37.697582,47.7604959,46.0792562,44.2990984,46.1557093,48.7522778,45.687631,47.7311563,34.2702901,48.8605064,43.2319073,43.382971,43.3989849,49.7601625,43.350395,43.3612255,37.6893413,40.081503,38.7375267,41.674963,41.3066201,40.1993369,42.7865326,42.7862966,37.4407591,43.6726633,60.493162,42.2913235,41.6636444,42.7614887,44.0807359,44.2232336,44.2195588,42.8861277,44.1793572,42.6673128,50.8943234,50.8943504,17.994505,47.135776,40.8007406,45.6873135,24.1785673,57.3300325,40.2191734,37.2742282,44.9671617,47.7424241,41.7399933,42.1181726,41.4302015,52.8567669,47.7245756,42.1458278,45.4086752,52.7648931,37.2475087,51.7897851,8.2455406,49.1392537,47.7200825,45.4206971,39.5104894,50.5756169,28.2586092,44.2353497,53.0663913,21.3172731,45.7620104,45.4083592,43.5935483,48.7110825,48.7506702,34.6693077,50.057701,47.5276431,31.7151602,25.2756896,39.5171305,39.7509175,27.3036602,39.566992,39.5438531,39.663264,39.5489832,39.5249311,39.549878,39.8365401,39.5041231,39.557014,41.7533352,50.7846509,30.2182221,44.0934656,47.7118152,43.1804956,47.7207633,47.600586,43.5225193,45.9327874,42.345812,44.2403777,4.9266637,38.8580378,28.307153,48.9493953,39.8671139,17.8842865,17.8754722,18.3614265,17.7422794,18.0900567,18.1189183,18.1669462,18.177307,45.605862,43.3318087,43.6517501,49.3833773,25.3275109,-34.129325,44.0215878,45.7077885,54.1881178,45.791728,47.7184154,43.22687,43.7844813,43.7001207,25.6448928,43.0636354,50.6732889,60.7928889,42.7802212,44.0598918,37.7038142,40.7464968,47.1475756,47.1485693,47.1648211,40.0038035,46.3332701,48.9932263,43.5722336,-5.2257626,-4.4537963,33.5068345,44.4733996,41.3489504,46.0593893,49.1646785,45.1961361,43.5700191,35.451162,44.5953892,43.3476271,38.8580601,42.978708,45.7448032,43.7788491,37.0033215,37.9078518,44.7422986,41.0897227,37.6890735,44.2512209,29.0187655,49.2477639,47.7002788,45.7661204,44.926509,45.8329696,44.1541786,45.2987245,43.5383579,56.8544325,43.3242219,44.2525922,37.7767225,40.4716313,44.2487726,40.4069338,47.4849249,33.0497582,40.1742995,47.8863879,50.48454,47.9151172,44.7115538,20.7234353,42.609568,43.8557192,44.3145972,40.3680228,41.6793961,37.1952537,47.0750659,47.9055338,48.2693361,48.2689774,47.3840299,48.5105156,45.5216547,47.3060969,47.2822834,47.5865209,47.5850227,38.8992334,43.2072853,7.3012787,44.9399281,43.9095012,47.6705458,41.6676337,22.5499302,45.1564942,40.1499691,49.057581,46.1147313,46.1144738,45.2403189,32.0764457,46.09317,45.8885497,50.798858,45.4525836,-34.8036235,52.2985624,48.6052339,40.2596657,43.1222861,37.5490266,41.8324458,41.7763022,39.8483576,45.7404627,49.485665,43.9886585,44.5788543,47.966714,33.2198171,48.4177032,48.4855272,45.8960263,45.6698242,45.6927333,50.5098868,50.2128351,28.9157936,38.9261292,40.1444822,48.3648547,30.6131555,48.5163643,40.0183166,41.142928,23.9477649,32.2846965,48.6913979,45.395279,48.6252627,48.6514441,38.9402974,54.1858892,40.542229,40.1259588,38.6920658,49.1767716,44.1166957,44.0639601,44.064006,39.5465076,42.9542442,44.1125642,44.0783233,43.0774934,44.0071287,42.9872315,43.9750898,44.0655216,42.7753578,44.038795,44.078888,44.0455625,42.4623157,44.1102669,47.14945,43.257021,46.1331679,40.3395658,42.169942,42.2212147,44.388827,42.7923644,36.923215,39.8129032,32.8821363,44.6373458,35.431311,40.1351717,42.4658476,41.9651706,25.0171275,49.8045419,45.5631583,42.5988125,48.5770462,-51.6087209,40.66074,44.7522742,34.9578242,20.6868198,49.0859181,45.9900401,50.2421418,41.6827343,50.5093323,47.8626362,48.6047404,43.9185304,50.8589506,45.8662642,40.0737755,36.7049556,48.481563,49.7036911,45.1194615,46.2213102,40.0245653,31.7778677,52.1343679,32.7664364,46.3311762,54.2140833,42.7279471,45.2757977,-37.4214483,45.7127309,40.7446231,46.9411716,24.9891353,40.7664051,37.1321228,38.9536376,48.2780003,48.2819984,47.8510044,43.0559208,38.5276322]},"kind":"numeric","n":69716,"n_null":0,"n_unique":69544,"null_rate":0.0,"stats":{"iqr":7.255502175000004,"kurtosis":11.499182025079556,"max":78.1817271,"mean":40.58213393029147,"median":44.14308795,"min":-77.9764944,"n_outliers":8996,"outlier_rate":0.1290378105456423,"q1":40.49452245,"q3":47.750024625,"skew":-3.160679959391871,"std":15.475569597429715,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"16.2% rows beyond 1.5 IQR"}],"column":"lon","extras":{"histogram":{"counts":[54,6,49,20,6,18,352,454,283,361,579,1877,236,168,252,203,26,182,766,9279,14696,22468,8156,1754,1346,530,479,150,381,210,212,1114,956,696,395,363,330,46,33,230],"edges":[-178.0045299,-169.0844669775,-160.164404055,-151.24434113249998,-142.32427821,-133.4042152875,-124.484152365,-115.5640894425,-106.64402652,-97.7239635975,-88.803900675,-79.8838377525,-70.96377483,-62.0437119075,-53.123648985,-44.203586062499994,-35.28352314,-26.363460217500005,-17.44339729500001,-8.523334372499988,0.39672855000000595,9.3167914725,18.236854394999995,27.15691731749999,36.07698023999998,44.997043162500006,53.917106085,62.837169007499995,71.75723192999999,80.67729485250001,89.597357775,98.5174206975,107.43748362,116.35754654249999,125.27760946499998,134.19767238749998,143.11773530999997,152.03779823249997,160.95786115500002,169.8779240775,178.797987]},"sample":[-15.5098908,15.4550242,121.0875744,119.6203696,14.3239409,-3.7727534,-2.3966705,7.8535761,-5.9737758,9.4850781,-5.9726768,11.5650314,12.1835225,40.432634,5.8260171,8.0470913,10.2553703,-4.4238299,-3.7267943,-4.2310289,-3.7286759,-3.8846469,-3.6156697,34.3439457,177.4775685,16.5997821,-72.1643185,16.213532,15.986138,15.4750108,48.9278497,15.497965,16.5563852,11.6804856,11.706104,11.6311813,12.9507321,12.1680826,15.2343191,15.8013603,14.2551978,10.4128783,92.8981017,-5.7237169,-5.7653464,98.8220118,11.8748477,61.3261572,-0.3042288,-0.2989654,3.3373185,34.5582737,10.2149166,39.7474183,14.4932432,2.8777864,15.8667368,5.7164189,-90.4296216,17.2558661,15.836364,172.1810925,15.4141051,122.5201321,15.034872,-81.5865425,15.6117908,16.0603355,16.5780341,16.94735,15.1428702,3.050117,125.8693764,15.1363137,13.8160793,4.4769191,13.8806984,14.9434162,40.237651,15.801874,44.6983983,11.682067,14.7982917,-124.3645441,13.6545513,58.1471214,13.5540844,2.0022955,-32.458066,-17.9313204,15.3661829,15.3566,11.2376208,3.0356458,5.7583129,13.891239,8.3732112,8.2995056,-4.2766696,14.6748252,0.0328824,11.6667694,119.6353829,40.8516641,-124.9109378,11.2514356,15.685483,0.1996285,9.5210968,4.9575854,0.1099391,14.6685533,20.68067,19.66892,20.445358,15.93981,20.6904601,-0.4046283,14.9707782,39.3670022,19.8200752,22.7655004,15.6804135,42.5686696,2.4469674,41.9149093,-0.5698198,16.8309924,-115.5361904,16.0591122,5.725893,15.4275513,-17.135134,19.7550274,151.6466488,-0.6074695,11.5641315,2.7066234,15.9556783,14.1819492,2.8097751,3.1084904,24.8223,15.714614,11.59318,20.7273419,35.3323983,5.5432437,15.7889266,22.0943692,15.7768357,15.0348646,15.7763187,11.6211941,16.3037047,11.8038808,131.6441667,13.9209029,15.7986997,117.1854825,19.2047903,5.3776685,12.9738803,12.9632807,17.6829176,12.6000496,12.5853336,15.0931688,18.4834955,16.1628647,2.009133,1.86385,-3.5103526,12.527671,12.4059891,13.4379444,6.8105351,5.2603335,-0.1693562,21.3178988,2.0920842,10.1230959,10.3265524,10.3266952,2.015945,11.8657786,-73.0643782,14.2811973,14.2812234,104.4485839,0.1261292,20.6342391,13.8321891,-76.4470674,25.6004191,-0.2260469,14.82043,7.3255967,15.7496884,2.9578436,1.4942462,1.3038327,-2.6309983,15.747046,-2.5736142,14.1697579,-4.7950423,21.9089104,10.8280791,98.7354574,19.4020191,15.7945174,25.1927489,21.1309483,14.596453,-16.6965003,11.7304847,-9.222163,44.0747054,22.4209935,14.0520378,-6.2442811,-1.8439661,15.9213333,138.9534805,14.3656569,13.7121693,-116.6956937,110.3060816,2.7977622,2.7813582,52.6893157,2.5860631,2.5688252,2.5631302,2.5436541,2.4231581,2.5756871,2.9953841,3.2999281,2.5445061,12.6845646,13.0867553,31.9852714,0.9936565,15.6896847,-0.6729273,15.6838819,15.0567673,2.2886742,8.7983017,42.6039971,39.286669,-73.8322556,-0.1326916,-16.7762078,19.222884,116.0669956,-77.5651529,-77.5649129,-77.5534123,-77.2111094,-77.2757437,-76.3327998,-77.2068832,-77.7569974,13.9236098,5.7806584,6.5807786,20.4492655,45.9483368,-71.9980417,5.5938807,13.7945842,7.8747851,14.7485916,12.9827392,5.9111063,3.3829924,6.359215,45.6875813,-5.9848432,19.4019406,22.3192585,10.1669663,10.723439,15.0073687,0.246947,0.1790368,0.1816612,0.1462078,-0.3735127,8.7884696,19.4176704,3.601209,-78.3642203,-37.7972196,-105.493465,3.757361,23.0654066,10.9342943,19.1839173,21.918199,6.1902566,138.652353,33.7322481,17.099269,-0.5911665,17.1293772,13.6958793,3.8122561,15.1806636,23.8083049,-0.1550936,14.2969822,15.0603917,40.7548374,-13.6735242,19.8647306,15.738019,9.5963981,1.6425198,-123.0496345,1.0917639,6.798318,2.9829876,49.041857,18.58654,40.0961989,-2.1318859,-2.1365301,-121.1784558,115.7002389,19.0521678,35.2361482,8.620709,15.172568,5.11447,15.9359263,1.320481,-89.3634935,-0.0100608,3.623575,21.5950432,0.2398263,15.9486714,15.102371,15.0728944,2.1414804,2.7462642,2.7468063,0.5385814,1.5433671,11.1180276,0.4422506,0.4347293,3.769085,3.7650699,-0.3014348,19.751041,134.4891808,5.3300604,3.7427977,14.8778833,1.9517559,114.2707553,5.6033512,18.4859489,-122.220903,11.5705828,11.5705101,6.9476835,12.572324,11.0549873,10.9225798,5.6636607,23.3156653,150.0145861,-1.5714759,20.5020407,0.3032379,69.9207669,27.3922177,-3.1627547,-3.1097656,115.7318295,0.4317894,5.5747,10.2220959,33.531846,16.195767,67.7736982,15.9583921,15.8750284,12.0795184,11.1901833,11.1757389,5.6917833,4.9705508,-13.8433658,46.5306166,18.4804228,9.4189536,-9.4672752,2.4020791,3.7926904,24.6872951,46.4288308,77.1492744,18.6378535,5.8174811,20.9232245,21.0008222,46.5170747,-2.4955,15.3055912,18.5065622,21.2873853,19.5839009,10.2139884,10.221014,10.2301063,-8.791816,11.8879389,10.2302653,10.286781,11.7349043,10.4686116,11.8859761,10.3408651,10.2890883,11.6507277,10.3287844,10.3402474,10.3321311,11.2843578,10.2345787,0.0854766,-3.7047275,12.5638083,44.3889955,-2.1748408,-2.6729143,4.4030608,-2.2614276,-110.0752041,45.6619586,10.498667,7.9892793,118.0590659,18.4662783,2.7914052,3.2181087,121.690465,6.322886,10.4214082,-2.7046223,20.7787386,-60.4499977,0.2302018,14.7548199,25.2332005,-100.4570267,2.2403061,13.6323306,7.6400942,2.0152644,5.650725,14.2063214,20.6930789,3.7419849,20.4985636,8.7732777,18.4812847,3.6334133,20.4605783,-123.1855927,6.9800715,13.6924435,15.2824363,35.2192558,-7.3754701,-16.8204516,12.8436916,-2.5120862,-0.3112497,6.8975195,148.2092758,7.5948799,-77.5102792,17.5862849,121.4141397,-0.5954179,15.0185008,-0.5319244,17.133919,17.1275396,16.0430255,-3.3449158,-0.0931799]},"kind":"numeric","n":69716,"n_null":0,"n_unique":69585,"null_rate":0.0,"stats":{"iqr":16.939316025,"kurtosis":4.509206314320611,"max":178.797987,"mean":12.02535771042372,"median":11.37646115,"min":-178.0045299,"n_outliers":11302,"outlier_rate":0.16211486602788455,"q1":1.244825925,"q3":18.18414195,"skew":0.27550583587888633,"std":40.499807085255306,"zero_rate":0.0}},{"alerts":[{"code":"one_word","level":"warn","message":"94.3% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"94.7% duplicate strings"}],"column":"description","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[65286,422,544,501,458,437,344,218,205,170,229,85,70,60,54,48,51,42,34,34,26,24,23,24,19,13,27,13,18,21,20,12,23,18,16,9,8,17,22,71],"edges":[0.0,6.375,12.75,19.125,25.5,31.875,38.25,44.625,51.0,57.375,63.75,70.125,76.5,82.875,89.25,95.625,102.0,108.375,114.75,121.125,127.5,133.875,140.25,146.625,153.0,159.375,165.75,172.125,178.5,184.875,191.25,197.625,204.0,210.375,216.75,223.125,229.5,235.875,242.25,248.625,255.0]},"near_unique":false,"sample":["","","","","unerforschtes, nordschauendes Portal","","","","","","N\u00b0 3120 del Catasto Speleologico Regionale del Friuli Venezia Giulia","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","",""],"top_values":[["",65189],["nicht katasterw\u00fcrdig",68],["unterer Eingang",31],["oberer Eingang",23],["Halbh\u00f6hle",21],["fluviokrasov\u00e1",21],["Schluf",17],["Osteingang",16],["Westeingang",15],["Entr\u00e9e d'une carri\u00e8re souterraine",15],["Erdstall",14],["Nische, nicht katasterw\u00fcrdig",13],["Not really caves but man-made rock caves",13],["lava cave",12],["Ez da haitzuloa, leizea, kobazuloa edo harpea, izenak adierazten duen bezala, baizik eta arku harritsu natural bat (begia, leihoa edo tunela) No es una cueva o abrigo rocoso como el nombre podr\u00eda indicar pero un arco rocoso natural (ojo, ventana o t\u00fanel)",11],["cave difficulty: easy",10],["unerforscht",10],["kleine Halbh\u00f6hle",9],["NW-Eingang",9],["S-Eingang",9]],"top_words":[["de",304],["m",147],["del",110],["in",104],["a",103],["the",99],["mit",92],["nicht",85],["cave",83],["katasterw\u00fcrdig",69],["eingang",62],["la",54],["der",53],["of",52],["h\u00f6hle",50],["cova",49],["da",46],["catasto",45],["n\u00b0",43],["speleologico",43],["regionale",43],["friuli",43],["venezia",43],["and",43],["di",40]],"vocab_skipped":null,"word_histogram":{"counts":[66241,908,750,362,309,335,139,51,88,65,63,26,43,46,18,41,39,34,12,19,34,21,14,31,8,10,3,2,1,3],"edges":[1.0,2.7333333333333334,4.466666666666667,6.2,7.933333333333334,9.666666666666668,11.4,13.133333333333333,14.866666666666667,16.6,18.333333333333336,20.066666666666666,21.8,23.533333333333335,25.266666666666666,27.0,28.733333333333334,30.46666666666667,32.2,33.93333333333334,35.66666666666667,37.4,39.13333333333333,40.86666666666667,42.6,44.333333333333336,46.06666666666667,47.800000000000004,49.53333333333333,51.266666666666666,53.0]}},"kind":"text","n":69716,"n_null":0,"n_unique":3705,"null_rate":0.0,"stats":{"allcaps_rate":0.0024097768087669976,"boilerplate_rate":1.4343909575994034e-05,"duplicate_rate":0.9468558150209421,"emoji_rate":0.0,"len_max":255,"len_mean":3.4617591370703997,"len_median":0.0,"len_min":0,"len_p95":19.0,"n_duplicates":66011,"n_empty":65189,"one_word_rate":0.9427534568822078,"readability_flesch_mean":1.7521209709294931,"url_rate":0.0006311320213437375,"vocab_size":4651,"word_mean":1.4554908485856906,"word_median":1.0}},{"alerts":[],"column":"access","extras":{"singletons":6,"top_values":[["",62551],["yes",2717],["no",2266],["private",815],["permit",575],["permissive",440],["customers",271],["unknown",47],["destination",11],["restricted",9],["tidal",2],["request",2],["key",2],["discouraged",2],["designated",1],["official",1],["forestry",1],["agricultural",1],["guided",1],["university",1]]},"kind":"categorical","n":69716,"n_null":0,"n_unique":20,"null_rate":0.0,"stats":{"cardinality":20,"entropy":0.7067450003454716,"entropy_ratio":0.1635253953395286,"top_rate":0.8972258878880027,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.2% of rows"}],"column":"tourism","extras":{"singletons":5,"top_values":[["",67776],["attraction",1670],["viewpoint",119],["yes",105],["camp_site",7],["museum",6],["register",6],["artwork",6],["information",5],["picnic_site",4],["cave_entrance",3],["caves",2],["wilderness_hut",2],["attraction;museum",1],["guestbook",1],["no",1],["cave",1],["hotel",1]]},"kind":"categorical","n":69716,"n_null":0,"n_unique":18,"null_rate":0.0,"stats":{"cardinality":18,"entropy":0.2076157840602457,"entropy_ratio":0.04978885327396407,"top_rate":0.9721728154225716,"top_value":""}},{"alerts":[{"code":"one_word","level":"warn","message":"97.6% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"97.0% duplicate strings"}],"column":"wikipedia","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[67531,0,42,85,252,402,335,445,243,131,102,72,33,13,12,6,4,1,1,1,3,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[0.0,2.85,5.7,8.55,11.4,14.25,17.1,19.95,22.8,25.650000000000002,28.5,31.35,34.2,37.050000000000004,39.9,42.75,45.6,48.45,51.300000000000004,54.15,57.0,59.85,62.7,65.55,68.4,71.25,74.10000000000001,76.95,79.8,82.65,85.5,88.35000000000001,91.2,94.05,96.9,99.75,102.60000000000001,105.45,108.3,111.15,114.0]},"near_unique":false,"sample":["","","","","","","","","","","","sq:Shpella e Kusarit","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","",""],"top_values":[["",67531],["ru:\u0421\u0438\u043a\u0438\u044f\u0437-\u0422\u0430\u043c\u0430\u043a",6],["de:Ein\u00f6dh\u00f6hle",5],["de:H\u00f6llgrotten",5],["ca:Forat de Bul\u00ed",5],["en:Buchan Caves",4],["fr:Carri\u00e8re de Lanaye Inf\u00e9rieure",4],["ca:Espluga d'en Pon\u00e7a",4],["de:Sch\u00f6nsteinh\u00f6hle",3],["de:Finsteres Loch (Schw\u00e4bische Alb)",3],["en:Clifden Limestone Caves",3],["en:Elephanta Caves",3],["de:Badlh\u00f6hle",3],["es:Cueva de los Tayos",3],["hu:Barlangok a Bakonyban",3],["de:Grj\u00f3tagj\u00e1",2],["ru:\u041a\u0443\u043d\u0433\u0443\u0440\u0441\u043a\u0430\u044f \u043f\u0435\u0449\u0435\u0440\u0430",2],["de:Bingh\u00f6hle",2],["de:Lurgrotte",2],["de:Frauenmauerh\u00f6hle",2]],"top_words":[["de",83],["cave",44],["fr:grotte",36],["pl:jaskinia",24],["es:cueva",21],["la",17],["di",17],["it:grotta",16],["del",15],["ca:cova",15],["jasky\u0148a",13],["\u043f\u0435\u045b\u0438\u043d\u0430",13],["du",13],["des",11],["ro:pe\u0219tera",10],["fr:grottes",9],["w",8],["jama",8],["it:grotte",7],["\u043f\u0435\u0449\u0435\u0440\u0430",6],["caves",6],["los",6],["h\u00f6hle",5],["pt:gruta",5],["pe\u0107ina",5]],"vocab_skipped":null,"word_histogram":{"counts":[68017,0,816,0,549,0,251,0,48,0,19,0,10,0,0,4,0,1,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.4666666666666668,1.9333333333333333,2.4,2.8666666666666667,3.3333333333333335,3.8,4.266666666666667,4.733333333333333,5.2,5.666666666666667,6.133333333333334,6.6,7.066666666666666,7.533333333333333,8.0,8.466666666666667,8.933333333333334,9.4,9.866666666666667,10.333333333333334,10.8,11.266666666666667,11.733333333333334,12.2,12.666666666666666,13.133333333333333,13.6,14.066666666666666,14.533333333333333,15.0]}},"kind":"text","n":69716,"n_null":0,"n_unique":2077,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.9702076998106604,"emoji_rate":0.0,"len_max":114,"len_mean":0.6359802627804234,"len_median":0.0,"len_min":0,"len_p95":0.0,"n_duplicates":67639,"n_empty":67531,"one_word_rate":0.9756296976303861,"readability_flesch_mean":-0.024849999999999425,"url_rate":0.0,"vocab_size":940,"word_mean":1.0439497389408456,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"96.4% duplicate strings"}],"column":"website","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[67082,0,11,45,130,161,109,118,86,101,223,45,49,1360,127,16,14,8,2,5,5,0,5,1,6,0,0,0,1,1,0,0,0,1,2,0,1,0,0,1],"edges":[0.0,6.375,12.75,19.125,25.5,31.875,38.25,44.625,51.0,57.375,63.75,70.125,76.5,82.875,89.25,95.625,102.0,108.375,114.75,121.125,127.5,133.875,140.25,146.625,153.0,159.375,165.75,172.125,178.5,184.875,191.25,197.625,204.0,210.375,216.75,223.125,229.5,235.875,242.25,248.625,255.0]},"near_unique":false,"sample":["","","","","","https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4762-23","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","","",""],"top_values":[["",67082],["https://www.angloasianmining.com/",19],["https://akkh.de/",7],["https://www.noe.gv.at/natural_monuments/7cf5f4b1-dc06-4ea7-b6dd-5f2c5aad62d7.PDF",6],["https://whc.unesco.org/en/list/1527/",4],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=5430-1",4],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4840-1",4],["https://carrodillasostenible.wordpress.com/2011/05/01/cuevas/",4],["http://www.nicau.be/galeries/lanayeinf/1.html",4],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4762-1",4],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4762-2",4],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4450-1",3],["https://www.vanschaikstichting.nl/index.php/groeven/groeve-de-keel",3],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4773-1",3],["https://www.doc.govt.nz/parks-and-recreation/places-to-go/southland/places/clifden-area/?tab-id=Caving",3],["https://whc.unesco.org/en/list/244",3],["https://kulturdb.de/einobjekt.php?id=1516",3],["https://www.speleork.sk/",3],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=5430-3",3],["https://jaskiniepolski.pgi.gov.pl/Details/Information/2997",3]],"top_words":[["https://www.angloasianmining.com/",6],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4521-72",2],["https://grupoedelweiss.com/pdf/cubia6-b.pdf",2],["https://www.catastospeleologicoregionale.sardegna.it/",2],["https://www.noe.gv.at/natural_monuments/7cf5f4b1-dc06-4ea7-b6dd-5f2c5aad62d7.pdf",2],["https://whc.unesco.org/en/list/1527/",2],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4840-1",2],["https://www.youtube.com/watch?v=t9cpiirshrk",2],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=5372-87",2],["https://jaskiniepolski.pgi.gov.pl/details/information/2997",2],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4450-1",2],["https://www.cretanbeaches.com/en/caves/samonas-cave",1],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=5452-67",1],["https://geo.regione.emilia-romagna.it/schede/speleo/index.jsp?id=723",1],["https://www.ennstalwiki.at/wiki/index.php/frauenbild_pass_stein",1],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=5452-89",1],["http://www.mersch.lu/4b%20mersch%20-%20prehistorical%20remains.pdf?fileid=publications%2f4b+mersch+-+prehistorical+remains.pdf",1],["https://www.katasterjam.si/caves/details/1395",1],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=2891-1",1],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=5451-36",1],["https://geo.regione.emilia-romagna.it/schede/speleo/index.jsp?id=456",1],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=4840-208",1],["http://www.infos-escalade.be/ausny/ausny.htm",1],["https://termeszetvedelem.hu/talalati-oldal/?type=orszagos-barlangnyilvantartas&id=2891-13",1],["https://www.vanschaikstichting.nl/index.php/groeven/groeve-de-keel",1]],"vocab_skipped":null,"word_histogram":{"counts":[69715,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.0333333333333334,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666667,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333333,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5,1.5333333333333332,1.5666666666666667,1.6,1.6333333333333333,1.6666666666666665,1.7,1.7333333333333334,1.7666666666666666,1.8,1.8333333333333335,1.8666666666666667,1.9,1.9333333333333333,1.9666666666666668,2.0]}},"kind":"text","n":69716,"n_null":0,"n_unique":2492,"null_rate":0.0,"stats":{"allcaps_rate":1.4343909575994034e-05,"boilerplate_rate":0.0,"duplicate_rate":0.9642549773366229,"emoji_rate":0.0,"len_max":255,"len_mean":2.7889580584084,"len_median":0.0,"len_min":0,"len_p95":0.0,"n_duplicates":67224,"n_empty":67082,"one_word_rate":0.999985656090424,"readability_flesch_mean":-24.041499999999996,"url_rate":0.0377531700040163,"vocab_size":737,"word_mean":1.0000143439095759,"word_median":1.0}},{"alerts":[{"code":"long_tail","level":"info","message":"158 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 99.1% of rows"}],"column":"cave:length","extras":{"singletons":158,"top_values":[["",69074],["5",32],["6",26],["10",25],["3",23],["4",23],["7",20],["8",19],["15",16],["20",14],["12",13],["30",13],["2",11],["11",9],["60",8],["4.5",8],["13",8],["16",8],["17",8],["25",8]]},"kind":"categorical","n":69716,"n_null":0,"n_unique":238,"null_rate":0.0,"stats":{"cardinality":238,"entropy":0.1392135600548953,"entropy_ratio":0.017633536862865413,"top_rate":0.9907912100522118,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"87 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 99.6% of rows"}],"column":"cave:depth","extras":{"singletons":87,"top_values":[["",69419],["0",63],["10",13],["3",11],["1",9],["5",9],["4",8],["25",7],["30",6],["6",6],["2",6],["11",5],["35",5],["28",4],["14",4],["40",4],["70",4],["12",3],["8",3],["15",3]]},"kind":"categorical","n":69716,"n_null":0,"n_unique":124,"null_rate":0.0,"stats":{"cardinality":124,"entropy":0.06432301503539317,"entropy_ratio":0.009249525346202768,"top_rate":0.9957398588559297,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"country","extras":{"singletons":8,"top_values":[["",69684],["KY",7],["AU",6],["DE",3],["RO",2],["US",2],["EC",2],["IT",2],["GB",1],["MT",1],["CH",1],["GR",1],["ET",1],["LB",1],["VN",1],["PT",1]]},"kind":"categorical","n":69716,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"cardinality":16,"entropy":0.007359773467821954,"entropy_ratio":0.0018399433669554885,"top_rate":0.9995409948935682,"top_value":""}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","columns.name.top_values","columns.name.stats.duplicate_rate","columns.description.stats.n_empty","columns.website.stats.n_empty","columns.wikipedia.stats.n_empty","columns.lat.stats.skew","columns.lat.stats.outlier_rate","columns.lon.stats.outlier_rate","columns.country.stats.top_rate","columns.access.top_values","columns.tourism.top_values"],"featured_charts":[{"caption":"Check the left-skewed latitude distribution to see how heavily caves cluster in the Northern Hemisphere.","column":"lat","kind":"histogram"},{"caption":"Longitude spread reveals the European core versus scattered entries across the Americas and Asia-Pacific.","column":"lon","kind":"histogram"},{"caption":"Among rows that specify access, compare yes/no/private/permit to gauge how reachable tagged caves are.","column":"access","kind":"bar"},{"caption":"Note that 'attraction' dominates the tagged tourism values, dwarfing viewpoints, museums, and other uses.","column":"tourism","kind":"bar"},{"caption":"Name lengths center around 13 characters, but watch for the huge 'Unnamed Cave' spike inflating duplicates.","column":"name","kind":"length"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset catalogs 69,716 caves with 12 columns covering names, geocoordinates, country, tourism/access tags, and optional metadata like description, website, and Wikipedia links. The headline issue is sparsity in the descriptive fields: 'description' is empty in 65,189 rows, 'website' in 67,082, and 'wikipedia' in 67,531, so most analytical signal sits in name and coordinates. Worth a closer look first: the 'name' column, where 19,527 entries are literally 'Unnamed Cave' and overall duplicate rate is 35%, and the geographic spread, where 'lat' is heavily left-skewed (skew -3.16) with ~12.9% outliers and 'lon' has ~16.2% outliers, suggesting a Northern-Hemisphere/European concentration with scattered global entries. The 'country' field is almost entirely blank (99.95%), so country-level analysis will need to be derived from coordinates rather than read off directly. 'Access' is the most usable categorical, with meaningful splits across yes/no/private/permit when present.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.skew","stats.kurtosis","stats.zero_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"This column is almost certainly a row identifier: all 69716 values are unique with zero nulls, and the numeric range spans roughly 1.28e7 to 1.354e10 with near-zero skew (0.02) and negative kurtosis (-1.18), consistent with broadly distributed assigned IDs rather than a measured quantity. No outliers or zeros are flagged. Treat the numeric stats as incidental \u2014 the magnitudes carry no analytical meaning.","role":"identifier","scope":"column","target":"id","treatment":"Drop from modelling; retain only as a join key."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","duplicate_rate","n_duplicates","top_values","top_words","len_mean","word_mean","vocab_size"],"model":"anthropic:claude-opus-4-7","narrative":"Short free-text names of caves/caverns in mixed languages (English 'Cave', French 'Grotte', Italian 'Grotta', Spanish 'Cueva', Cyrillic '\u0413\u0440\u043e\u0442', German 'B\u00e4renh\u00f6hle'), averaging 2.5 words and 15.5 characters. Severe duplication (35.1%, 24,487 rows) is dominated by the placeholder 'Unnamed Cave' appearing 19,527 times \u2014 over a quarter of all rows are effectively unlabelled. Of 69,716 rows only 45,229 are unique, and the vocabulary of 15,219 tokens reflects the multilingual mix.","role":"label","scope":"column","target":"name","treatment":"Treat 'Unnamed Cave' as missing and language-normalise before any text matching or grouping."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","median","mean","skew","kurtosis","iqr","n_outliers","outlier_rate","n","n_unique","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Latitude coordinates spanning -77.98 to 78.18, so the column covers nearly the full globe from Antarctic to Arctic ranges. The distribution is heavily left-skewed (skew -3.16, kurtosis 11.5) with a tight IQR of 7.26 around a median of 44.14, indicating most points cluster in northern mid-latitudes while a long tail of southern-hemisphere values produces 8,996 outliers (12.9%). Near-unique values (69,544 of 69,716) confirm these are precise geocoordinates rather than bucketed regions.","role":"feature","scope":"column","target":"lat","treatment":"Pair with longitude for geospatial features; consider binning or projecting rather than treating as a raw scalar."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","q1","q3","std","n","n_unique","null_rate","zero_rate","outlier_rate","n_outliers","skew","kurtosis"],"model":"anthropic:claude-opus-4-7","narrative":"This is a longitude coordinate, with values spanning the full -178.00 to 178.80 range and 69,585 unique values across 69,716 rows. The distribution is centered near 12.03 (median 11.38) with IQR 1.24 to 18.18, suggesting a heavy concentration in European/African longitudes, but the std of 40.50 and 16.2% flagged outliers reveal a long global tail. No nulls or zeros are present.","role":"feature","scope":"column","target":"lon","treatment":"Pair with latitude for geospatial features; do not treat outliers as errors since the global range is legitimate."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_empty","stats.len_mean","stats.word_median","stats.one_word_rate","stats.vocab_size","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"A free-text 'description' field, but 65189 of 69716 rows (94.7% duplicate rate) are empty strings, leaving only ~4500 populated entries with a mean length of 3.46 characters and median word count of 1. The non-empty values are short multilingual fragments \u2014 German ('nicht katasterw\u00fcrdig', 'unterer Eingang'), French ('Entr\u00e9e d'une carri\u00e8re souterraine'), and other tokens like 'cave' and 'Halbh\u00f6hle' \u2014 suggesting cave/feature annotations rather than prose. With 92.8% one-word rate and a vocab of 4651, this is closer to sparse tagging than narrative text.","role":"free_text","scope":"column","target":"description","treatment":"Treat as sparse optional tag: flag presence as a boolean feature and ignore the text body unless modelling the populated subset."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical access-permission tag, almost certainly the OSM-style `access` key indicating who may use a feature. 89.7% of the 69,716 rows are empty strings, leaving only ~10% with substantive values like `yes` (2,717), `no` (2,266), `private` (815), `permit` (575), and `permissive` (440). Entropy ratio is just 0.16 and 20 distinct values appear, so the signal is sparse but the long tail (`customers`, `destination`, `restricted`, `unknown`) is meaningful when present.","role":"feature","scope":"column","target":"access","treatment":"Treat empty string as missing, then collapse rare levels and one-hot encode the survivors."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is an OSM-style `tourism` tag categorising features like attractions, viewpoints, and museums across 18 distinct values. The column is severely imbalanced: 97.2% of the 69,716 rows are empty strings, with `attraction` (1,670) and `viewpoint` (119) the only non-trivial categories. Entropy ratio of 0.05 confirms almost no information content as-is.","role":"feature","scope":"column","target":"tourism","treatment":"Treat empty string as missing and either drop or collapse rare categories into a binary `is_tourism` flag."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.duplicate_rate","stats.n_empty","stats.one_word_rate","stats.len_max","stats.vocab_size","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Wikipedia article references in the OSM-style `lang:Article Title` format (e.g. `de:Ein\u00f6dh\u00f6hle`, `fr:Grotte...`), mostly pointing to cave-related pages across many languages. It is overwhelmingly empty: 67,531 of 69,716 rows are blank and the duplicate rate is 0.97, leaving only 2,077 unique values. Among the populated entries, language prefixes span de, fr, pl, es, it, ca, en, ru and more, so any downstream use must handle multilingual strings.","role":"metadata","scope":"column","target":"wikipedia","treatment":"Split into language prefix and title, and treat as a sparse optional reference rather than a modelling feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","n_empty","duplicate_rate","one_word_rate","word_mean","url_rate","top_values","len_max"],"model":"anthropic:claude-opus-4-7","narrative":"This is a website/URL field for each record, but it is overwhelmingly empty: 67,082 of 69,716 rows (n_empty) are blank, leaving only 2,492 unique values across the column. Where populated, entries are single-token URLs (one_word_rate 0.99998, word_mean ~1.0) pointing to varied external domains (angloasianmining.com, unesco.org, termeszetvedelem.hu, etc.). The duplicate_rate of 0.96 is driven almost entirely by the empty string, and url_rate is only 0.038 because the metric is computed over all rows including blanks.","role":"metadata","scope":"column","target":"website","treatment":"Treat as optional reference URL; impute missing as null and avoid using as a feature given >96% blanks."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a cave length attribute (likely OpenStreetMap-style tag) stored as a string, with 99.08% of the 69,716 rows being empty and only 238 distinct values overall. When populated, values look like small integers (5, 6, 10, 3, 4...) suggesting metres, but the signal is so sparse (entropy ratio 0.0176) that it carries almost no information. The non-null counts in the top values are tiny (\u226432 each), indicating this tag is rarely filled in upstream.","role":"metadata","scope":"column","target":"cave:length","treatment":"Drop or convert to a numeric 'has_length' indicator; the column is too sparse to model directly."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a cave depth attribute, likely sourced from an OpenStreetMap-style tag, stored as strings. It is effectively empty: 69,419 of 69,716 rows (top_rate 0.9957) carry the blank value \"\", and the remaining 124 distinct values are tiny integer-like strings ranging from \"0\" to \"30\" with single- or low-double-digit counts. Entropy ratio of 0.0092 confirms there is virtually no signal here.","role":"metadata","scope":"column","target":"cave:depth","treatment":"Drop; near-constant blank with negligible entropy."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Two-letter ISO country code, but effectively empty: 69,684 of 69,716 rows (top_rate 0.9995) carry a blank string, leaving only 32 rows spread across 15 actual codes (KY, AU, DE, RO, US, etc.). Entropy ratio of 0.0018 confirms there is essentially no signal here. No nulls are reported because the missingness is encoded as empty string rather than NULL.","role":"feature","scope":"column","target":"country","treatment":"Drop; near-constant empty string with only 32 populated rows."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":4500,"prompt_tokens":18279,"total_tokens":22779}},"language_counts":{},"meta":{"generated_at":"2026-05-01T23:17:16+00:00","mode":"full","row_count":69716,"sampled_rows":69716,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/caves.json"},"notes":[],"saturn_version":"0.2.0","schema":{"access":"categorical","cave:depth":"categorical","cave:length":"categorical","country":"categorical","description":"text","id":"numeric","lat":"numeric","lon":"numeric","name":"text","tourism":"categorical","website":"text","wikipedia":"text"}}
