{"columns":[{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"73.1% rows are a single word"}],"column":"n","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[25,193,748,1095,1082,833,521,333,271,231,208,213,188,199,144,91,75,68,63,69,150,48,26,30,21,8,7,10,14,6,8,2,10,1,4,0,1,0,1,1],"edges":[1.0,2.05,3.1,4.15,5.2,6.25,7.300000000000001,8.350000000000001,9.4,10.450000000000001,11.5,12.55,13.600000000000001,14.65,15.700000000000001,16.75,17.8,18.85,19.900000000000002,20.95,22.0,23.05,24.1,25.150000000000002,26.200000000000003,27.25,28.3,29.35,30.400000000000002,31.450000000000003,32.5,33.550000000000004,34.6,35.65,36.7,37.75,38.800000000000004,39.85,40.9,41.95,43.0]},"near_unique":true,"sample":["Abaza","Rajbanshi","T\u00e0y","Solos","Kachi Koli","Yangum Gel","Eastern Krahn","San Mart\u00edn Itunyoso Triqui","Sonia","Angal Enen","Mouk-Aria","Mandan","West Goodenough","Abureni","Batuley","Ndzwani Comorian","Baraamu","Suwawa","Santa Catarina Albarradas Zapotec","Khalaj","Hiw","Anjam","Chambri","Bassa-Kontagora","Oroha","Tavringer Romani","Mawak","Cuiba","Kenati","Yarawata","Ngbaka Ma'bo","Zimakani","Car Nicobarese","Kayagar","Cashibo-Cacataibo","Kota (Gabon)","Wakhi","Madak","Kula","Mambai","Sinhala","Vame","Gobu","Vai","Wolio","Yintale Karen","New Caledonian Javanese","Baram Kayan","Southern 
Carrier","Toaripi"],"top_values":[],"top_words":[["language",145],["sign",144],["southern",69],["northern",64],["zapotec",57],["mixtec",52],["western",51],["eastern",48],["central",45],["naga",43],["creole",33],["quechua",33],["arabic",32],["new",31],["guinea)",28],["nahuatl",28],["(papua",27],["north",26],["chin",26],["malay",26],["san",22],["south",20],["english",20],["dogon",19],["(nigeria)",18]],"vocab_skipped":null,"word_histogram":{"counts":[5118,0,0,0,0,0,1345,0,0,0,0,0,401,0,0,0,0,0,103,0,0,0,0,0,27,0,0,0,0,4],"edges":[1.0,1.1666666666666667,1.3333333333333333,1.5,1.6666666666666665,1.8333333333333333,2.0,2.1666666666666665,2.333333333333333,2.5,2.6666666666666665,2.833333333333333,3.0,3.1666666666666665,3.333333333333333,3.5,3.6666666666666665,3.833333333333333,4.0,4.166666666666666,4.333333333333333,4.5,4.666666666666666,4.833333333333333,5.0,5.166666666666666,5.333333333333333,5.5,5.666666666666666,5.833333333333333,6.0]}},"kind":"text","n":6998,"n_null":0,"n_unique":6998,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":43,"len_mean":8.971991997713632,"len_median":7.0,"len_min":1,"len_p95":21.0,"n_duplicates":0,"n_empty":0,"one_word_rate":0.7313518148042297,"readability_flesch_mean":57.130225000000024,"url_rate":0.0,"vocab_size":7003,"word_mean":1.3692483566733353,"word_median":1.0}},{"alerts":[],"column":"lat","extras":{"histogram":{"counts":[1,1,1,0,2,5,9,13,23,48,100,101,217,202,461,749,640,344,434,609,676,264,368,210,282,320,131,124,148,81,107,65,68,68,35,20,34,18,13,6],"edges":[-55.27,-52.05975,-48.849500000000006,-45.639250000000004,-42.429,-39.21875,-36.008500000000005,-32.79825,-29.588000000000005,-26.377750000000006,-23.167500000000004,-19.957250000000002,-16.747000000000007,-13.536750000000005,-10.326500000000003,-7.116250000000008,-3.906000000000006,-0.6957500000000039,2.514499999999991,5.724749999999993,8.934999999999995,12.145249999999997,15.3555,18.565749999999987,21.775999999
99999,24.98624999999999,28.196499999999993,31.406749999999995,34.617,37.827249999999985,41.03749999999999,44.24774999999999,47.45799999999999,50.66824999999999,53.878499999999995,57.08875,60.298999999999985,63.50924999999999,66.71949999999998,69.92974999999998,73.14]},"sample":[10.71,5.38,7.65,-9.09,-1.85,-7.66,-0.4,42.32,36.48,5.22,-4.6,-4.05,-13.56,24.05,-4.49,26.0,9.08,-7.85,35.42,30.34,36.3,49.29,-10.1,27.59,-4.14,24.6,-8.49,14.05,-9.33,11.82,12.54,26.0,10.35,2.94,6.81,14.81,-1.73,1.45,-1.57,-7.1,4.65,1.41,53.6,-3.96,53.23,-2.27,9.67,-2.12,4.75,11.47,-10.65,-8.57,1.5,-8.52,-5.8,-8.32,18.19,-5.86,10.19,4.49,41.46,27.71,24.85,-3.49,-4.67,48.25,2.2,27.19,6.94,27.65,9.49,36.22,-4.69,23.55,11.65,11.47,-6.11,23.25,42.41,14.82,9.68,29.7,7.44,42.69,23.79,22.87,17.86,25.0,29.76,-18.74,17.67,54.32,10.87,11.04,49.72,22.41,9.89,9.63,-2.18,42.43,9.93,29.52,7.91,42.26,32.55,-10.15,-5.41,7.71,7.78,1.88,-6.69,11.95,-3.74,5.12,4.21,7.76,9.5,17.22,-4.02,10.93,18.61,-4.91,6.15,6.63,6.56,6.46,5.55,-8.02,10.68,4.62,-4.24,21.77,6.52,-9.28,11.05,8.21,-14.94,11.81,2.47,9.23,14.97,-8.27,9.34,-3.9,19.63,-7.72,21.55,35.77,31.1,22.02,18.78,46.91,-9.16,40.0,-9.03,16.9,3.61,6.36,27.52,36.21,-4.0,6.64,3.97,17.42,2.06,3.68,32.27,12.76,42.07,10.43,9.71,13.83,-3.71,9.85,-3.41,10.06,32.28,3.48,43.56,-18.68,-4.49,36.05,0.92,1.42,-8.23,-7.64,27.94,12.05,19.61,-16.59,-2.89,10.35,10.48,31.83,42.59,-8.41,11.7,-5.59,12.24,10.95,-1.44,-4.03,-9.43,1.72,-9.07,12.92,12.62,27.21,-14.29,-5.37,-6.46,6.49,-5.62,27.19,6.92,12.81,26.45,14.67,-2.43,-4.5,28.38,-11.91,-15.73,6.54,-23.0,-38.58,48.79,42.0,-9.7,-3.7,-1.12,23.59,24.73,-8.39,41.9,19.01,28.05,5.06,-13.5,-17.6,-1.96,-2.33,24.94,51.02,0.86,-4.61,-9.43,61.85,-5.74,4.56,-3.34,25.09,-3.45,-9.23,-13.64,1.75,-4.56,-4.72,-8.87,-5.85,47.31,-5.08,6.51,8.38,-1.88,-5.9,9.33,10.08,-38.29,1.19,9.54,19.79,22.76,-8.18,18.15,6.17,8.21,2.27,24.85,-3.67,45.99,-6.33,5.01,18.63,34.25,10.68,-4.79,10.15,54.19,7.96,-2.26,-4.62,-4.95,-19.81,24.15,-3.58,22.57,-8.41,5.9,26.32,24.2
,13.89,18.2,19.33,18.62,20.06,25.97,-16.9,9.32,33.46,-0.53,1.53,1.33,7.29,52.97,-39.29,46.31,-4.68,73.14,-15.26,10.61,10.72,-4.1,9.19,-3.5,6.82,-13.37,5.76,48.22,4.88,-29.71,1.92,-22.28,4.75,26.15,7.3,4.62,5.3,42.92,8.67,7.43,8.84,-8.33,-2.56,35.51,-1.63,10.08,13.59,-3.02,-5.65,23.59,18.72,23.01,-1.9,-26.97,38.39,-6.55,51.84,38.91,18.38,18.14,14.73,15.36,-16.5,21.8,13.35,22.64,36.95,-10.41,-10.18,-14.18,-10.33,-3.25,20.53,8.0,-3.33,2.27,14.46,-1.17,23.68,46.39,-8.2,37.09,-7.17,-6.99,-3.15,6.27,13.48,21.64,-4.44,28.74,4.55,-4.2,-2.66,-3.72,35.78,11.63,9.51,36.38,11.28,57.49,52.13,2.66,-8.27,7.24,48.53,2.58,12.84,-3.28,52.89,-3.99,-5.93,18.66,-7.95,14.33,-6.82,-10.23,21.38,9.85,-8.38,-5.07,8.97,23.16,-6.7,9.07,-8.58,13.21,6.86,-15.23,10.72,10.88,14.67,35.0,10.42,6.64,42.56,-4.8,7.31,22.68,-4.4,-3.35,-3.09,10.85,25.0,-16.73,35.16,15.36,-5.43,20.56,-6.92,-13.89,-15.58,-4.99,6.14,-18.65,0.56,-8.42,-6.15,7.51,-15.42,-18.25,7.4,-21.99,-3.05,-3.63,-14.06,-1.14,-3.2,8.23,-2.39,-19.0,-9.59,-5.62,39.15,-1.94,-3.77,9.45,1.68,-2.21,-3.47,-15.35,-7.86,-4.29,17.37,-6.43,-6.27,65.52,-2.0,16.87,16.73,16.03,17.09,17.34,6.54,23.4,22.8,22.4,-2.64,24.06,17.3]},"kind":"numeric","n":6998,"n_null":0,"n_unique":4048,"null_rate":0.0,"stats":{"iqr":22.939999999999998,"kurtosis":0.47732525329530695,"max":73.14,"mean":8.437130608745356,"median":6.37,"min":-55.27,"n_outliers":149,"outlier_rate":0.02129179765647328,"q1":-4.65,"q3":18.29,"skew":0.6974759120739835,"std":17.9988188867515,"zero_rate":0.0}},{"alerts":[],"column":"lng","extras":{"histogram":{"counts":[11,4,9,11,10,15,94,37,71,257,50,176,150,112,48,21,0,3,95,261,420,687,297,402,211,113,27,73,212,191,242,386,202,437,266,512,597,106,170,12],"edges":[-178.78,-169.82775,-160.8755,-151.92325,-142.971,-134.01875,-125.06649999999999,-116.11425,-107.16199999999999,-98.20974999999999,-89.2575,-80.30524999999999,-71.35299999999998,-62.40074999999999,-53.44849999999998,-44.496249999999975,-35.54399999999998,-26.59174999999999,-17.63949999999997,-8
.687249999999977,0.2650000000000148,9.217250000000035,18.169500000000028,27.12175000000002,36.07400000000004,45.02625000000003,53.978500000000025,62.93075000000002,71.88300000000004,80.83525000000006,89.78750000000005,98.73975000000004,107.69200000000004,116.64425000000003,125.59650000000002,134.54875,143.50100000000006,152.45325000000005,161.40550000000005,170.35775000000004,179.31]},"sample":[6.01,-4.53,6.13,142.53,138.16,145.67,15.46,21.38,3.55,-4.43,145.51,142.0,130.04,94.28,144.77,85.53,8.51,-57.91,3.23,42.18,42.0,-106.07,151.0,82.47,144.84,103.71,160.77,108.47,124.26,-15.32,-15.67,64.0,13.61,21.05,24.1,-3.77,105.9,124.85,119.34,143.99,9.25,117.94,56.56,14.1,25.6,138.87,8.81,139.25,16.67,-15.13,123.31,118.44,30.03,142.71,145.35,124.25,104.95,144.09,12.94,29.13,45.08,84.35,106.19,142.5,145.56,-3.79,22.61,92.47,10.2,90.8,11.07,74.82,21.46,106.02,-3.18,5.27,-45.13,105.52,-76.6,-89.24,11.52,80.48,122.19,-124.38,92.33,92.99,-96.52,116.0,118.23,-67.9,-97.24,89.55,103.83,5.54,-124.97,-104.47,-84.12,11.36,40.37,47.44,9.52,66.6,0.6,45.81,75.71,148.45,142.47,-0.43,2.27,29.29,142.66,28.59,140.9,6.37,11.39,9.44,9.3,121.45,143.14,9.25,82.98,-49.02,36.67,2.21,2.03,1.69,-0.3,156.55,14.22,7.34,35.8,77.37,0.17,150.76,35.93,6.69,144.83,5.08,10.25,8.19,107.86,124.52,-1.58,142.85,-155.44,35.73,103.16,-110.53,101.72,100.88,104.77,19.66,18.19,-97.0,-37.14,121.04,34.25,6.31,79.68,44.07,34.85,9.97,9.37,120.7,10.68,102.29,44.24,-15.74,48.26,33.75,12.15,107.26,143.88,7.71,128.53,11.27,77.16,24.82,42.26,122.33,143.59,-118.68,114.45,116.68,123.77,145.41,82.65,105.02,99.34,22.6,141.19,8.13,13.36,-96.5,-121.7,124.43,30.47,145.51,75.92,-73.8,111.91,143.62,150.46,9.74,149.27,75.2,75.11,92.63,167.47,-70.51,145.66,116.85,147.86,86.85,-9.96,106.54,103.33,104.91,102.19,-74.0,84.93,133.72,30.28,10.21,-69.0,146.5,-115.06,74.0,119.34,142.24,23.36,101.55,98.9,123.59,12.45,98.76,89.72,11.11,167.33,168.2,25.33,147.74,99.83,5.88,124.12,16.73,119.19,33.73,146.36,-66.58,151.97,85.33,134.07,148.73,39.53,10
3.08,129.91,152.21,31.23,151.03,126.56,144.81,18.79,25.9,125.82,150.68,-10.54,9.76,176.54,-58.59,15.8,79.91,92.21,129.83,-96.57,8.24,-5.73,111.76,67.01,142.68,-65.58,147.71,102.05,-98.1,62.28,-14.38,145.42,98.68,42.67,117.03,121.03,121.82,145.6,34.61,90.63,142.96,103.14,-57.69,10.03,94.38,94.13,-89.44,-94.75,-99.8,-99.4,-97.9,102.6,168.57,16.13,51.95,166.92,27.97,18.62,11.31,139.21,175.77,-116.41,141.03,86.21,167.14,12.92,30.0,19.51,92.77,142.25,11.52,19.05,8.28,-121.97,10.35,19.08,30.02,-53.72,6.91,127.78,6.25,31.91,37.02,-76.12,41.44,6.22,117.87,121.72,147.28,71.84,121.27,6.37,105.03,101.69,19.83,103.73,73.37,108.09,11.22,131.36,-99.25,143.92,18.63,-123.66,-97.63,-97.59,-89.74,-90.58,167.78,79.24,-81.37,121.0,-94.66,-76.96,-77.42,-72.67,-76.28,121.06,93.15,10.58,102.43,37.36,107.95,-71.61,92.03,24.23,157.41,49.88,144.18,36.92,130.53,120.54,103.98,100.77,142.37,72.68,-54.02,141.66,132.47,134.45,51.44,-5.88,34.64,43.14,4.41,72.56,4.91,113.84,156.54,0.44,-121.99,34.76,124.0,140.92,6.09,152.77,-48.59,104.37,145.73,22.0,39.13,150.37,104.01,-3.71,124.17,141.73,1.14,-103.98,155.75,-82.96,125.58,99.87,99.7,166.84,-4.53,30.16,-87.04,71.1,-61.42,36.42,-124.29,142.09,0.38,101.77,143.99,141.16,142.03,76.8,67.0,-68.97,72.64,-90.89,145.64,73.3,146.9,167.43,167.27,30.57,11.88,137.61,37.86,143.5,146.51,-59.35,132.6,144.37,-7.25,-63.6,128.84,143.76,141.93,-73.83,144.09,-6.72,12.26,-47.0,-48.26,146.21,69.24,132.1,139.26,10.29,-64.88,139.47,141.97,124.53,147.46,142.95,81.97,141.21,145.02,-171.75,-76.36,-97.19,-95.36,-96.05,-96.89,-96.71,10.17,104.4,108.0,106.9,32.18,93.93,-93.1]},"kind":"numeric","n":6998,"n_null":0,"n_unique":5560,"null_rate":0.0,"stats":{"iqr":115.6525,"kurtosis":-0.6730146994302877,"max":179.31,"mean":52.45887682194913,"median":47.65,"min":-178.78,"n_outliers":12,"outlier_rate":0.0017147756501857674,"q1":8.282499999999999,"q3":123.935,"skew":-0.49824007836862205,"std":79.67324237966837,"zero_rate":0.0}},{"alerts":[{"code":"high_skew","level":"info","message":"ske
w=+39.45"},{"code":"outliers","level":"warn","message":"16.6% rows beyond 1.5 IQR"}],"column":"p","extras":{"histogram":{"counts":[6943,28,5,12,0,3,1,0,0,2,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1],"edges":[0.0,24113830.0,48227660.0,72341490.0,96455320.0,120569150.0,144682980.0,168796810.0,192910640.0,217024470.0,241138300.0,265252130.0,289365960.0,313479790.0,337593620.0,361707450.0,385821280.0,409935110.0,434048940.0,458162770.0,482276600.0,506390430.0,530504260.0,554618090.0,578731920.0,602845750.0,626959580.0,651073410.0,675187240.0,699301070.0,723414900.0,747528730.0,771642560.0,795756390.0,819870220.0,843984050.0,868097880.0,892211710.0,916325540.0,940439370.0,964553200.0]},"sample":[22000.0,204000.0,4300.0,5000.0,4400.0,2000.0,52000.0,6250000.0,240000.0,53000.0,1000.0,1600.0,0.0,23600.0,3400.0,3900.0,600.0,0.0,38621400.0,14532900.0,12739600.0,5600.0,3000.0,65300.0,2100.0,118000.0,12000.0,302000.0,81000.0,573900.0,144200.0,6476500.0,74000.0,235200.0,13100.0,4200.0,692060.0,11000.0,0.0,500.0,5800.0,19000.0,1655500.0,150000.0,8537300.0,1830.0,1508000.0,2200.0,196000.0,65000.0,9500.0,861000.0,336000.0,1800.0,1300.0,21000.0,4400.0,83000.0,26000.0,2600.0,800.0,12000.0,3655900.0,900.0,2300.0,0.0,815000.0,1400.0,1300.0,23000.0,9100.0,267000.0,343000.0,400.0,138000.0,227000.0,2700.0,260000.0,4050.0,159000.0,52000.0,0.0,1168000.0,0.0,146400.0,69500.0,2300.0,43926200.0,5308000.0,2400.0,0.0,0.0,0.0,47000.0,2100.0,7800.0,15000.0,94000.0,3300.0,699500.0,12000.0,0.0,30000.0,18500.0,536700.0,1900.0,30000.0,15000.0,207000.0,58000.0,300.0,0.0,2600.0,58000.0,418000.0,26000.0,53000.0,8900.0,2400.0,0.0,12000.0,1800.0,83000.0,591000.0,141000.0,1125000.0,152000.0,5100.0,67000.0,197000.0,117000.0,0.0,24000.0,600.0,639000.0,35000.0,800.0,0.0,6500.0,52000.0,7100.0,1800.0,12000.0,13000.0,644000.0,1683000.0,2721000.0,15000.0,63000.0,1100.0,5000.0,11596200.0,1014000.0,54000.0,4400.0,38000.0,17600.0,46000.0,7504000.0,3800.0,106000.0,24000.0,2700.0,17000.0,8100.0,5000.0,
0.0,534500.0,107700.0,106500.0,23000.0,6000.0,300.0,38000.0,0.0,46000.0,0.0,13000.0,382400.0,0.0,3900.0,0.0,2300.0,900.0,37000.0,12000.0,0.0,17921600.0,139100.0,9400.0,3600.0,3100.0,8400.0,0.0,0.0,6100.0,166000.0,4800.0,116000.0,21000.0,11000.0,1500.0,2000.0,18000.0,6900.0,0.0,0.0,0.0,300.0,50.0,5900.0,2900.0,9400.0,0.0,948000.0,6100.0,5400.0,521000.0,4500.0,21400.0,0.0,0.0,289000.0,900.0,0.0,0.0,1800.0,6089100.0,35000.0,1400.0,148000.0,51000.0,48000.0,4400.0,0.0,8500.0,3600.0,19000.0,200.0,900.0,241000.0,800.0,177000.0,0.0,0.0,600.0,14000.0,13000.0,1100.0,1100.0,9300.0,4100.0,14000.0,5300.0,477000.0,304000.0,22000.0,6400.0,1109000.0,7100.0,148000.0,100.0,354000.0,0.0,5500.0,6200.0,4969000.0,200.0,674000.0,0.0,354000.0,0.0,248000.0,1100.0,11000.0,273000.0,0.0,1300.0,0.0,11000.0,26900.0,4200.0,200.0,1400.0,0.0,29000.0,1100.0,6900.0,483000.0,27900.0,22000.0,50000.0,100.0,150000.0,99000.0,24000.0,1600.0,12000.0,166000.0,235000.0,0.0,12000.0,36700.0,500.0,2500.0,26000.0,49000.0,6400.0,180000.0,9800.0,6000.0,65000.0,23000.0,127000.0,0.0,0.0,700.0,46000.0,0.0,800.0,12000.0,42000.0,19000.0,27000.0,1900.0,0.0,62000.0,3600.0,0.0,2300.0,0.0,116000.0,0.0,23000.0,1155600.0,16000.0,35800.0,0.0,1950.0,8291000.0,39000.0,14000.0,14000.0,3000.0,24000.0,186000.0,57000.0,2000.0,42000.0,1222000.0,51000.0,0.0,2341000.0,2100.0,3800.0,0.0,20000.0,43314700.0,0.0,11000.0,2900.0,51000.0,186000.0,0.0,0.0,0.0,13000.0,0.0,9300.0,13000.0,257000.0,15000.0,400.0,2893500.0,0.0,414000.0,90000.0,20000.0,0.0,2400.0,23517600.0,20000.0,300.0,3100.0,259000.0,0.0,54000.0,0.0,2100.0,2400.0,8100.0,37700.0,1400.0,2700.0,1500.0,0.0,754000.0,19000.0,253000.0,30000.0,176600.0,15000.0,80.0,5500.0,99000.0,0.0,0.0,245000.0,2500.0,0.0,8200.0,400.0,1500.0,8300.0,539000.0,293000.0,2600.0,0.0,15700.0,4800.0,15000.0,529000.0,13000.0,53000.0,6300.0,445000.0,37000.0,5361600.0,700.0,31000.0,23000.0,23000.0,4800.0,11000.0,25000.0,0.0,700.0,20000.0,29000.0,2300.0,600.0,800.0,0.0,165849500.0,0.0,0.0,5400.0,1600.0,1257000.0,1
00.0,500.0,900.0,33000.0,47600.0,0.0,22000.0,5200.0,30700.0,49000.0,100.0,0.0,346000.0,5600.0,22000.0,800.0,0.0,14100.0,3100.0,150000.0,58000.0,0.0,3200.0,2500.0,0.0,2200.0,8300.0,0.0,10700.0,900.0,300.0,0.0,2100.0,700.0,0.0,9100.0,22000.0,0.0,0.0,300.0,5800.0,2700.0,7200.0,3900.0,4200.0,109000.0,2049000.0,2146000.0,453000.0,93000.0,16000.0]},"kind":"numeric","n":6998,"n_null":0,"n_unique":1627,"null_rate":0.0,"stats":{"iqr":81800.0,"kurtosis":1870.0128930194041,"max":964553200.0,"mean":1157741.5404401259,"median":11000.0,"min":0.0,"n_outliers":1159,"outlier_rate":0.16561874821377537,"q1":1200.0,"q3":83000.0,"skew":39.451722275175065,"std":17303553.708627757,"zero_rate":0.13460988853958275}},{"alerts":[],"column":"s","extras":{"histogram":{"counts":[250,0,0,0,0,0,0,0,328,0,0,0,0,0,0,0,383,0,0,0,0,0,0,0,1768,0,0,0,0,0,0,0,1176,0,0,0,0,0,0,3093],"edges":[0.0,0.125,0.25,0.375,0.5,0.625,0.75,0.875,1.0,1.125,1.25,1.375,1.5,1.625,1.75,1.875,2.0,2.125,2.25,2.375,2.5,2.625,2.75,2.875,3.0,3.125,3.25,3.375,3.5,3.625,3.75,3.875,4.0,4.125,4.25,4.375,4.5,4.625,4.75,4.875,5.0]},"sample":[5.0,5.0,5.0,5.0,5.0,3.0,4.0,2.0,5.0,5.0,5.0,3.0,1.0,3.0,3.0,4.0,2.0,0.0,5.0,5.0,5.0,3.0,5.0,5.0,2.0,4.0,5.0,5.0,4.0,5.0,5.0,5.0,4.0,5.0,5.0,3.0,1.0,2.0,3.0,5.0,3.0,4.0,4.0,5.0,4.0,4.0,5.0,3.0,5.0,4.0,5.0,5.0,4.0,5.0,5.0,3.0,5.0,5.0,5.0,3.0,2.0,4.0,5.0,3.0,5.0,5.0,5.0,3.0,5.0,4.0,5.0,3.0,5.0,2.0,5.0,5.0,3.0,5.0,2.0,3.0,5.0,3.0,5.0,1.0,4.0,5.0,3.0,5.0,5.0,3.0,4.0,2.0,3.0,4.0,1.0,4.0,5.0,5.0,3.0,4.0,3.0,5.0,5.0,3.0,5.0,5.0,5.0,3.0,5.0,5.0,3.0,2.0,3.0,5.0,5.0,5.0,5.0,5.0,3.0,0.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,4.0,3.0,5.0,4.0,4.0,3.0,4.0,5.0,5.0,5.0,3.0,4.0,3.0,3.0,2.0,5.0,5.0,3.0,5.0,4.0,5.0,5.0,2.0,4.0,4.0,3.0,5.0,3.0,3.0,0.0,5.0,4.0,5.0,5.0,4.0,3.0,5.0,1.0,5.0,3.0,5.0,4.0,1.0,3.0,1.0,5.0,4.0,5.0,5.0,3.0,5.0,5.0,3.0,3.0,5.0,5.0,0.0,0.0,3.0,5.0,5.0,3.0,3.0,4.0,3.0,5.0,5.0,5.0,4.0,3.0,3.0,3.0,2.0,5.0,4.0,5.0,3.0,5.0,4.0,5.0,2.0,4.0,1.0,4.0,2.0,5.0,3.0,0.0,0.0,2.0,5
.0,3.0,3.0,5.0,4.0,4.0,5.0,0.0,0.0,5.0,5.0,3.0,3.0,5.0,3.0,5.0,4.0,2.0,2.0,4.0,1.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,1.0,5.0,5.0,5.0,5.0,1.0,1.0,5.0,3.0,5.0,5.0,5.0,3.0,3.0,1.0,5.0,5.0,5.0,4.0,4.0,5.0,3.0,3.0,3.0,3.0,3.0,5.0,3.0,3.0,0.0,5.0,5.0,3.0,5.0,5.0,4.0,4.0,2.0,5.0,4.0,4.0,4.0,3.0,5.0,4.0,5.0,1.0,5.0,3.0,4.0,5.0,4.0,5.0,5.0,3.0,3.0,5.0,5.0,4.0,2.0,4.0,1.0,4.0,2.0,3.0,3.0,4.0,5.0,4.0,3.0,1.0,5.0,5.0,0.0,3.0,1.0,5.0,2.0,5.0,2.0,5.0,5.0,1.0,1.0,5.0,5.0,5.0,3.0,5.0,4.0,4.0,4.0,2.0,5.0,5.0,4.0,5.0,5.0,3.0,4.0,1.0,5.0,5.0,0.0,4.0,4.0,3.0,4.0,3.0,4.0,3.0,2.0,0.0,2.0,2.0,5.0,2.0,3.0,5.0,5.0,5.0,5.0,4.0,1.0,3.0,5.0,5.0,3.0,5.0,4.0,2.0,5.0,1.0,3.0,3.0,3.0,5.0,4.0,4.0,3.0,3.0,5.0,3.0,3.0,3.0,5.0,4.0,2.0,5.0,5.0,0.0,2.0,5.0,3.0,4.0,5.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,5.0,3.0,3.0,5.0,4.0,5.0,3.0,5.0,4.0,5.0,4.0,3.0,3.0,3.0,3.0,5.0,3.0,0.0,2.0,4.0,3.0,2.0,5.0,2.0,0.0,5.0,0.0,3.0,3.0,5.0,5.0,2.0,3.0,3.0,4.0,5.0,1.0,4.0,5.0,3.0,4.0,2.0,0.0,5.0,4.0,5.0,2.0,2.0,3.0,3.0,5.0,5.0,0.0,3.0,5.0,4.0,4.0,5.0,1.0,4.0,3.0,3.0,0.0,5.0,3.0,3.0,3.0,5.0,3.0,1.0,3.0,5.0,5.0,3.0,4.0,4.0,4.0,5.0,5.0,4.0,4.0,3.0]},"kind":"numeric","n":6998,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"iqr":2.0,"kurtosis":0.41542508642969,"max":5.0,"mean":3.79637039154044,"median":4.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":3.0,"q3":5.0,"skew":-1.0409465593602825,"std":1.3659337535181946,"zero_rate":0.03572449271220349}},{"alerts":[],"column":"ss","extras":{"singletons":0,"top_values":[["safe",3074],["definitely endangered",1753],["vulnerable",1160],["severely endangered",374],["critically 
endangered",327],["extinct",219],["unknown",91]]},"kind":"categorical","n":6998,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"cardinality":7,"entropy":2.1216401185475355,"entropy_ratio":0.7557434586833484,"top_rate":0.4392683623892541,"top_value":"safe"}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","stats.median","stats.max","stats.outlier_rate","top_values","top_words","stats.zero_rate"],"featured_charts":[{"caption":"Look at how the 'safe' plurality (44%) compares to the combined endangered and extinct categories \u2014 more than half of all languages (about 55%) are at some level of risk.","column":"ss","kind":"donut"},{"caption":"Expect a heavily right-skewed distribution; the vast majority of languages cluster near zero speakers while a tiny number reach hundreds of millions.","column":"p","kind":"histogram"},{"caption":"This numeric status score (0\u20135) shows how languages rank on a vitality scale \u2014 look for the concentration at the higher (safer) end versus the tail of critically low scores.","column":"s","kind":"bar"},{"caption":"The distribution of latitudes skews toward tropical and equatorial regions, revealing where the world's linguistic diversity is geographically concentrated.","column":"lat","kind":"histogram"},{"caption":"Most language names are short single words, but a long tail of compound names (up to 43 characters) reflects complex regional dialect naming conventions.","column":"n","kind":"length"}],"model":"anthropic:default","narrative":"This dataset catalogues approximately 7,000 world languages, each with a name, geographic coordinates, speaker population, and endangerment status. 
The most striking finding is the extreme inequality in speaker populations: the median language has only 11,000 speakers while the maximum reaches nearly 1 billion, with over 16% of languages flagged as outliers \u2014 a classic long-tail distribution reflecting how a handful of dominant languages vastly outnumber the rest. Equally notable is the endangerment picture: while 44% of languages are classified as 'safe', a substantial share face real risk \u2014 1,753 are 'definitely endangered', 327 are 'critically endangered', and 219 are already extinct. Top words in language names include 'sign', 'zapotec', 'mixtec', and directional qualifiers like 'southern' and 'northern', hinting at rich dialect clustering worth exploring geographically.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","n","duplicate_rate","null_rate","one_word_rate","top_words","word_mean","len_mean","vocab_size"],"model":"anthropic:default","narrative":"This column appears to be a name field for human languages or dialects \u2014 top words include 'language', 'sign', 'Zapotec', 'Mixtec', and directional qualifiers like 'southern', 'northern', 'western', 'eastern', 'central', consistent with a linguistic taxonomy dataset. All 6,998 rows are unique with zero duplicates and zero nulls, confirming it functions as a label or identifier. The majority of values (73%) are single words, but multi-word entries push the mean length to ~8.97 characters and mean word count to ~1.37, reflecting compound names like 'Southern Zapotec'. 
The vocabulary size (7,003) slightly exceeding the unique row count (6,998) is unremarkable given tokenization.","role":"label","scope":"column","target":"n","treatment":"Use as a human-readable label; encode as a categorical ID or embed via a language-name lookup for modelling."},{"confidence":"medium","critiques":[],"evidence_keys":["skew","kurtosis","median","mean","max","n_outliers","outlier_rate","zero_rate","iqr","q1","q3"],"model":"anthropic:default","narrative":"Column 'p' is a numeric field likely representing a price, population, or some monetary/count quantity with extreme positive skew (skew = 39.45, kurtosis = 1870.01). The median is 11,000 while the mean is 1,157,741 \u2014 a 100\u00d7 gap \u2014 driven by a long upper tail that reaches 964,553,200, with 1,159 outliers (16.6% of rows). An additional 13.5% of values are exactly zero, suggesting a two-population distribution (absent/zero vs. non-zero values) that may require separate treatment.","role":"feature","scope":"column","target":"p","treatment":"Separate zero and non-zero records, then log1p-transform the non-zero values before modelling; investigate whether zeros are true zeros or missing-data proxies."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","median","q1","q3","n_unique","n","skew","kurtosis","outlier_rate","null_rate"],"model":"anthropic:default","narrative":"This column contains geographic latitude values, spanning from -55.27\u00b0 (southern South America) to 73.14\u00b0 (Arctic latitudes), covering a wide swath of the globe with concentration in tropical and subtropical regions (median 6.37\u00b0, Q1 -4.65\u00b0, Q3 18.29\u00b0). The 4,048 unique values out of 6,998 rows indicate coordinate granularity likely at 2 decimal places, with some location repetition. 
Mild positive skew (0.697) and near-mesokurtic kurtosis (0.477) confirm most records cluster in equatorial-to-subtropical bands, consistent with datasets heavy in African, South/Southeast Asian, or Latin American records. Only 149 outliers (~2.1%) were flagged, likely corresponding to high-latitude locations in Europe or North America.","role":"feature","scope":"column","target":"lat","treatment":"Pair with a longitude column for geospatial analysis; consider binning into regions or using as-is in spatial models \u2014 do not normalize without care for geographic interpretation."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","iqr","kurtosis","n_outliers","skew"],"model":"anthropic:default","narrative":"This column contains geographic longitude values, spanning from -178.78 to 179.31 \u2014 nearly the full valid range of -180 to 180 degrees. The mean (52.46) and median (47.65) both fall at positive (eastern) longitudes, suggesting the dataset has a higher concentration of locations in Europe, Asia, or Africa than in the Americas. The IQR of 115.65 and low kurtosis (-0.67) indicate a broadly spread, relatively flat distribution across the globe with only 12 outliers flagged.","role":"feature","scope":"column","target":"lng","treatment":"Use as-is for geospatial modelling; consider pairing with latitude and projecting to a coordinate system, or binning into geographic regions as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","median","q1","q3","skew","zero_rate","null_rate"],"model":"anthropic:default","narrative":"This column is almost certainly an ordinal rating or severity score with exactly 6 discrete integer values ranging from 0 to 5. The distribution is notably left-skewed (skew = -1.04), meaning high scores (4\u20135) dominate \u2014 the median is 4.0 and Q3 is 5.0 \u2014 which would surprise an analyst expecting a balanced scale. 
Only 3.6% of rows are zero, suggesting the lowest value is rare rather than a default or sentinel.","role":"feature","scope":"column","target":"s","treatment":"Treat as ordinal; consider whether to one-hot encode or keep as integer, and note the left-skew may bias tree splits toward high values."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","top_value","top_rate","top_values","entropy_ratio"],"model":"anthropic:default","narrative":"This column encodes a conservation or endangerment status classification, with 7 distinct categories: six ordered levels ranging from 'safe' through 'extinct', plus an unordered 'unknown' value. The dominant class is 'safe' at 43.9% of 6,998 rows, while 'extinct' accounts for 219 records \u2014 a meaningful but minority signal. Entropy ratio of 0.756 indicates reasonable spread across categories, though the distribution is weighted toward the safer statuses. No nulls are present, but 91 rows carry the placeholder value 'unknown'; otherwise the label set is clean with no obvious noise.","role":"label","scope":"column","target":"ss","treatment":"Ordinal-encode in conservation-severity order (safe < vulnerable < definitely endangered < severely endangered < critically endangered < extinct; treat 'unknown' as missing) before modelling."}],"providers":["anthropic:default"],"total_usage":{"completion_tokens":2159,"prompt_tokens":5638,"total_tokens":7797}},"language_counts":{},"meta":{"generated_at":"2026-06-22T00:13:02+00:00","mode":"full","row_count":6998,"sampled_rows":6998,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/silence_data.json"},"notes":[],"saturn_version":"0.2.0","schema":{"lat":"numeric","lng":"numeric","n":"text","p":"numeric","s":"numeric","ss":"categorical"}}
