{"columns":[{"alerts":[{"code":"long_tail","level":"info","message":"69 singleton categories"}],"column":"name","extras":{"singletons":69,"top_values":[["Semeru",13],["Merapi",8],["Fuego",5],["Kelud",5],["Etna",5],["Mayon",5],["Asamayama",5],["Stromboli",4],["Paluweh",4],["Dieng Volcanic Complex",4],["Lengai, Ol Doinyo",4],["Izu-Oshima",3],["Iliwerung",3],["Toya",3],["Karangetang",3],["Villarrica",3],["Aira",3],["Vesuvius",3],["Tungurahua",2],["Rabaul",2]]},"kind":"categorical","n":200,"n_null":0,"n_unique":111,"null_rate":0.0,"stats":{"cardinality":111,"entropy":6.426665533658912,"entropy_ratio":0.9458746211705251,"top_rate":0.065,"top_value":"Semeru"}},{"alerts":[],"column":"country","extras":{"singletons":9,"top_values":[["Indonesia",57],["Japan",29],["Italy",13],["Philippines",12],["Guatemala",8],["Papua New Guinea",8],["United States",8],["Chile",8],["Russia",7],["Ecuador",4],["Mexico",4],["Tanzania",4],["Cameroon",3],["Iceland",3],["Congo, DRC",3],["Solomon Is.",3],["New Zealand",3],["Nicaragua",2],["Vanuatu",2],["Colombia",2]]},"kind":"categorical","n":200,"n_null":0,"n_unique":33,"null_rate":0.0,"stats":{"cardinality":33,"entropy":3.934319349895732,"entropy_ratio":0.7799389295926186,"top_rate":0.285,"top_value":"Indonesia"}},{"alerts":[],"column":"lat","extras":{"histogram":{"counts":[11,0,3,4,57,24,8,29,6,10,27,7,8,6],"edges":[-41.33,-33.80764285714286,-26.285285714285713,-18.762928571428574,-11.240571428571432,-3.7182142857142892,3.8041428571428497,11.326499999999996,18.848857142857135,26.371214285714274,33.89357142857142,41.415928571428566,48.9382857142857,56.460642857142844,63.983]},"sample":[14.473,-0.171,-1.467,16.72,10.41,-4.08,54.049,19.023,11.446,14.382,-7.54,-4.246,-19.532,-0.38,61.299,12.506,32.761,-7.935,56.653,-4.523,-38.379,37.748,38.789,-7.54,34.724,6.25,-8.108,37.748,4.892,6.25,13.257,-8.532,-0.162,34.094,56.056,-7.25,17.36,17.36,-8.108,-8.32,50.861,46.2,63.983,-4.647,37.748,-7.2,13.33,-8.108,12.769,42.544,-1.52,-11.75,56.056,-8.108,2.781,-0.38,19.421,2.781,36.921,14.473,-8.32,-8.532,-21.244,-10.386,14.473,-39.42,40.827,63.983,-7.54,-8.891,19.077,13.257,-8.108,-2.764,-7.935,3.689,-2.764,-10.386,10.83,14.011,12.3,-8.32,-39.42,-8.108,-8.24,-8.343,-8.343,14.473,9.979,0.81,43.418,-7.54,36.406,-40.59,1.352,32.885,34.724,53.13,55.972,31.577,-40.35,-3.613,-7.54,-8.497,32.885,34.724,-2.38,-7.935,-8.95,-8.991,-8.108,9.203,36.406,2.32,-39.42,-8.532,13.257,36.406,-8.108,-8.108,31.577,40.821,-7.2,38.789,42.544,52.825,-0.92,-8.108,2.781,-2.764,34.094,-7.2,30.484,13.257,-1.408,-4.246,36.406,12.769,30.443,49.12,36.618,14.473,38.789,-7.54,-6.101,37.748,42.063,14.757,-41.33,37.748,-8.32,13.257,-6.101,-7.2,36.404,43.418,-7.32,19.421,-7.54,13.813,38.789,-7.935,19.475,63.633,-38.157,-2.764,13.734,-41.33,-1.467,31.888,-37.52,31.577,-5.575,-8.108,3.689,-16.25,19.514,-1.408,58.266,-8.108,14.011,42.544,-8.108,4.203,12.888,-8.542,-21.338,40.821,40.821,-13.612,-11.75,-38.157,-7.54,30.484,14.757,14.809,13.33,-7.935,36.406,37.647]},"kind":"numeric","n":200,"n_null":0,"n_unique":111,"null_rate":0.0,"stats":{"iqr":40.727000000000004,"kurtosis":-0.4761940082210798,"max":63.983,"mean":10.077915,"median":4.5475,"min":-41.33,"n_outliers":0,"outlier_rate":0.0,"q1":-7.935,"q3":32.792,"skew":0.1985022224411008,"std":24.290385433134364,"zero_rate":0.0}},{"alerts":[],"column":"lon","extras":{"histogram":{"counts":[9,0,2,23,13,0,3,17,10,1,2,66,37,17],"edges":[-175.65,-150.44785714285715,-125.24571428571429,-100.04357142857143,-74.84142857142857,-49.639285714285705,-24.437142857142845,0.7650000000000148,25.967142857142875,51.169285714285735,76.3714285714286,101.57357142857146,126.77571428571432,151.97785714285718,177.18]},"sample":[-90.88,-78.598,-78.442,-62.18,123.13,145.037,159.443,-98.622,-85.515,-90.601,110.446,152.194,169.447,100.474,-152.251,-86.702,130.299,112.314,161.36,129.881,-71.586,14.999,15.213,110.446,139.394,10.5,112.922,14.999,-75.324,10.5,123.685,123.573,121.601,139.526,160.642,108.058,-93.23,-93.23,112.922,121.708,155.565,-122.18,-19.666,145.976,14.999,109.879,-61.18,112.922,124.056,140.839,29.25,43.38,160.642,112.922,125.407,100.474,-155.287,125.407,138.036,-90.88,121.708,123.573,55.708,165.804,-90.88,-71.93,14.139,-19.666,110.446,121.641,122.202,123.685,112.922,35.914,112.314,125.447,35.914,165.804,-85.324,120.998,-61.64,121.708,-71.93,112.922,115.378,115.508,115.508,-90.88,-83.852,127.332,142.686,110.446,138.523,-72.117,124.865,131.085,139.394,-168.693,160.595,130.659,-72.07,144.818,110.446,124.131,131.085,139.394,147.35,112.314,148.15,157.979,112.922,124.673,138.523,-76.4,-71.93,123.573,123.685,138.523,112.922,112.922,130.659,14.426,109.879,15.213,140.839,-169.944,-91.408,112.922,125.407,35.914,139.526,109.879,140.303,123.685,29.2,152.194,138.523,124.056,130.217,154.508,138.528,-90.88,15.213,110.446,105.423,14.999,140.677,-91.552,-72.618,14.999,121.708,123.685,105.423,109.879,25.396,142.686,107.73,-155.287,110.446,-89.633,15.213,112.314,-155.608,-19.083,176.507,35.914,-89.294,-72.618,-78.442,139.918,177.18,130.659,150.516,112.922,125.447,168.12,-103.62,29.2,-155.159,112.922,120.998,140.839,112.922,9.17,40.573,122.775,-175.65,14.426,14.426,-172.525,43.38,176.507,110.446,140.303,-91.552,-61.166,-61.18,112.314,138.523,140.281]},"kind":"numeric","n":200,"n_null":0,"n_unique":111,"null_rate":0.0,"stats":{"iqr":128.28225,"kurtosis":-0.6787804473968224,"max":177.18,"mean":59.155615,"median":112.314,"min":-175.65,"n_outliers":0,"outlier_rate":0.0,"q1":2.10675,"q3":130.389,"skew":-0.8560637954073457,"std":97.9728706166719,"zero_rate":0.0}},{"alerts":[],"column":"elevation","extras":{"histogram":{"counts":[4,17,27,24,27,12,22,23,11,22,3,0,4,4],"edges":[-185.0,213.42857142857144,611.8571428571429,1010.2857142857142,1408.7142857142858,1807.1428571428573,2205.5714285714284,2604.0,3002.4285714285716,3400.857142857143,3799.2857142857147,4197.714285714286,4596.142857142857,4994.571428571428,5393.0]},"sample":[3763.0,4784.0,5023.0,915.0,2422.0,1807.0,1513.0,5393.0,1394.0,2569.0,2910.0,688.0,361.0,2885.0,3374.0,728.0,1483.0,1730.0,3283.0,596.0,2832.0,3357.0,924.0,2910.0,746.0,3011.0,3657.0,3357.0,5279.0,3011.0,2462.0,583.0,404.0,775.0,4754.0,2168.0,1150.0,1150.0,3657.0,875.0,2285.0,2549.0,1490.0,1839.0,3357.0,2565.0,1220.0,3657.0,1535.0,733.0,3470.0,2361.0,4754.0,3657.0,1797.0,2885.0,1222.0,1797.0,2400.0,3763.0,875.0,583.0,2632.0,796.0,3763.0,2847.0,458.0,1490.0,2910.0,618.0,228.0,2462.0,3657.0,2962.0,1730.0,1318.0,2962.0,796.0,1916.0,311.0,-185.0,875.0,2847.0,3657.0,1711.0,2997.0,2997.0,3763.0,3436.0,1714.0,2077.0,2910.0,2568.0,2236.0,1299.0,1592.0,746.0,2149.0,2882.0,1117.0,1114.0,685.0,2910.0,1347.0,1592.0,746.0,270.0,1730.0,1680.0,-20.0,3657.0,1552.0,2568.0,4650.0,2847.0,583.0,2462.0,2568.0,3657.0,3657.0,1117.0,1281.0,2565.0,924.0,733.0,1730.0,1640.0,3657.0,1797.0,2962.0,775.0,2565.0,394.0,2462.0,3058.0,688.0,2568.0,1535.0,657.0,1145.0,2165.0,3763.0,924.0,2910.0,285.0,3357.0,1131.0,3745.0,1974.0,3357.0,875.0,2462.0,285.0,2565.0,367.0,2077.0,2665.0,1222.0,2910.0,1950.0,924.0,1730.0,4170.0,1490.0,1111.0,2962.0,1893.0,1974.0,5023.0,11.0,294.0,1117.0,724.0,3657.0,1318.0,1334.0,3850.0,3058.0,841.0,3657.0,311.0,733.0,3657.0,4095.0,1496.0,1703.0,-68.0,1281.0,1281.0,1858.0,2361.0,1111.0,2910.0,394.0,3745.0,1372.0,1220.0,1730.0,2568.0,1728.0]},"kind":"numeric","n":200,"n_null":0,"n_unique":109,"null_rate":0.0,"stats":{"iqr":1809.75,"kurtosis":-0.573758006002973,"max":5393.0,"mean":2074.21,"median":1848.5,"min":-185.0,"n_outliers":0,"outlier_rate":0.0,"q1":1113.25,"q3":2923.0,"skew":0.38795589927817015,"std":1235.0710702802555,"zero_rate":0.0}},{"alerts":[],"column":"type","extras":{"singletons":4,"top_values":[["Stratovolcano",139],["Complex volcano",22],["Shield volcano",12],["Caldera",9],["Submarine volcano",4],["Pyroclastic shield",3],["Lava dome",3],["Maar",2],["Tuff cone",2],["Cinder cone",1],["Compound volcano",1],["Pyroclastic cone",1],["Subglacial volcano",1]]},"kind":"categorical","n":200,"n_null":0,"n_unique":13,"null_rate":0.0,"stats":{"cardinality":13,"entropy":1.740361416051977,"entropy_ratio":0.47031205711040297,"top_rate":0.695,"top_value":"Stratovolcano"}},{"alerts":[{"code":"outliers","level":"warn","message":"7.5% rows beyond 1.5 IQR"}],"column":"vei","extras":{"histogram":{"counts":[7,0,15,0,77,0,0,70,0,23,0,6,0,2],"edges":[0.0,0.42857142857142855,0.8571428571428571,1.2857142857142856,1.7142857142857142,2.142857142857143,2.571428571428571,3.0,3.4285714285714284,3.8571428571428568,4.285714285714286,4.714285714285714,5.142857142857142,5.571428571428571,6.0]},"sample":[2.0,3.0,3.0,3.0,2.0,3.0,2.0,3.0,2.0,3.0,3.0,3.0,3.0,2.0,4.0,3.0,1.0,4.0,3.0,3.0,3.0,2.0,2.0,2.0,3.0,3.0,3.0,1.0,3.0,2.0,3.0,1.0,4.0,3.0,2.0,4.0,5.0,5.0,3.0,2.0,2.0,5.0,3.0,2.0,3.0,1.0,3.0,3.0,2.0,3.0,1.0,1.0,3.0,2.0,2.0,2.0,0.0,3.0,2.0,4.0,3.0,2.0,2.0,2.0,3.0,2.0,2.0,3.0,2.0,3.0,2.0,3.0,3.0,3.0,4.0,4.0,4.0,3.0,3.0,4.0,0.0,2.0,2.0,2.0,2.0,5.0,3.0,3.0,3.0,2.0,3.0,3.0,2.0,3.0,2.0,2.0,2.0,2.0,5.0,3.0,4.0,2.0,2.0,0.0,2.0,1.0,0.0,4.0,4.0,2.0,1.0,3.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,2.0,2.0,3.0,3.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,1.0,4.0,3.0,2.0,4.0,5.0,3.0,4.0,3.0,3.0,2.0,1.0,4.0,3.0,3.0,1.0,3.0,3.0,2.0,2.0,2.0,3.0,1.0,2.0,2.0,3.0,3.0,4.0,0.0,4.0,1.0,3.0,3.0,3.0,4.0,0.0,2.0,4.0,3.0,2.0,2.0,3.0,4.0,3.0,6.0,3.0,3.0,2.0,2.0,2.0,2.0,2.0,0.0,3.0,2.0,2.0,2.0,1.0,2.0,3.0,6.0,4.0,4.0,3.0,2.0,2.0]},"kind":"numeric","n":200,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":0.8382004608241127,"max":6.0,"mean":2.565,"median":3.0,"min":0.0,"n_outliers":15,"outlier_rate":0.075,"q1":2.0,"q3":3.0,"skew":0.21438660626708045,"std":1.0684018027223192,"zero_rate":0.035}},{"alerts":[],"column":"year","extras":{"histogram":{"counts":[16,14,12,9,12,10,14,15,15,17,16,21,13,16],"edges":[1900.0,1907.0714285714287,1914.142857142857,1921.2142857142858,1928.2857142857142,1935.357142857143,1942.4285714285713,1949.5,1956.5714285714287,1963.642857142857,1970.7142857142858,1977.7857142857142,1984.857142857143,1991.9285714285713,1999.0]},"sample":[1999.0,1999.0,1999.0,1997.0,1996.0,1996.0,1996.0,1996.0,1996.0,1995.0,1994.0,1994.0,1994.0,1992.0,1992.0,1992.0,1991.0,1990.0,1990.0,1988.0,1988.0,1987.0,1986.0,1986.0,1986.0,1986.0,1985.0,1985.0,1985.0,1984.0,1984.0,1983.0,1983.0,1983.0,1983.0,1982.0,1982.0,1982.0,1981.0,1981.0,1981.0,1980.0,1980.0,1979.0,1979.0,1979.0,1979.0,1978.0,1978.0,1978.0,1977.0,1977.0,1977.0,1976.0,1976.0,1975.0,1975.0,1974.0,1974.0,1974.0,1973.0,1973.0,1972.0,1971.0,1971.0,1971.0,1970.0,1970.0,1969.0,1969.0,1969.0,1968.0,1967.0,1967.0,1966.0,1966.0,1966.0,1966.0,1966.0,1965.0,1965.0,1964.0,1964.0,1963.0,1963.0,1963.0,1963.0,1963.0,1963.0,1962.0,1962.0,1961.0,1961.0,1960.0,1958.0,1957.0,1957.0,1957.0,1956.0,1955.0,1955.0,1954.0,1954.0,1953.0,1953.0,1953.0,1953.0,1951.0,1951.0,1951.0,1950.0,1950.0,1950.0,1949.0,1949.0,1948.0,1947.0,1947.0,1946.0,1946.0,1946.0,1944.0,1944.0,1944.0,1944.0,1944.0,1943.0,1941.0,1940.0,1940.0,1940.0,1939.0,1939.0,1938.0,1938.0,1937.0,1936.0,1933.0,1933.0,1933.0,1932.0,1932.0,1930.0,1930.0,1930.0,1929.0,1929.0,1929.0,1929.0,1928.0,1928.0,1928.0,1928.0,1928.0,1926.0,1926.0,1924.0,1924.0,1920.0,1920.0,1919.0,1919.0,1919.0,1918.0,1917.0,1917.0,1917.0,1917.0,1916.0,1915.0,1914.0,1914.0,1914.0,1913.0,1913.0,1913.0,1913.0,1912.0,1912.0,1911.0,1911.0,1910.0,1909.0,1909.0,1907.0,1907.0,1907.0,1906.0,1905.0,1905.0,1904.0,1903.0,1902.0,1902.0,1902.0,1902.0,1902.0,1901.0,1900.0,1900.0]},"kind":"numeric","n":200,"n_null":0,"n_unique":84,"null_rate":0.0,"stats":{"iqr":49.25,"kurtosis":-1.1688445737601993,"max":1999.0,"mean":1952.295,"median":1955.0,"min":1900.0,"n_outliers":0,"outlier_rate":0.0,"q1":1928.0,"q3":1977.25,"skew":-0.21342867893143286,"std":28.791364824235256,"zero_rate":0.0}},{"alerts":[],"column":"last_eruption","extras":{"histogram":{"counts":[16,14,12,9,12,10,14,15,15,17,16,21,13,16],"edges":[1900.0,1907.0714285714287,1914.142857142857,1921.2142857142858,1928.2857142857142,1935.357142857143,1942.4285714285713,1949.5,1956.5714285714287,1963.642857142857,1970.7142857142858,1977.7857142857142,1984.857142857143,1991.9285714285713,1999.0]},"sample":[1999.0,1999.0,1999.0,1997.0,1996.0,1996.0,1996.0,1996.0,1996.0,1995.0,1994.0,1994.0,1994.0,1992.0,1992.0,1992.0,1991.0,1990.0,1990.0,1988.0,1988.0,1987.0,1986.0,1986.0,1986.0,1986.0,1985.0,1985.0,1985.0,1984.0,1984.0,1983.0,1983.0,1983.0,1983.0,1982.0,1982.0,1982.0,1981.0,1981.0,1981.0,1980.0,1980.0,1979.0,1979.0,1979.0,1979.0,1978.0,1978.0,1978.0,1977.0,1977.0,1977.0,1976.0,1976.0,1975.0,1975.0,1974.0,1974.0,1974.0,1973.0,1973.0,1972.0,1971.0,1971.0,1971.0,1970.0,1970.0,1969.0,1969.0,1969.0,1968.0,1967.0,1967.0,1966.0,1966.0,1966.0,1966.0,1966.0,1965.0,1965.0,1964.0,1964.0,1963.0,1963.0,1963.0,1963.0,1963.0,1963.0,1962.0,1962.0,1961.0,1961.0,1960.0,1958.0,1957.0,1957.0,1957.0,1956.0,1955.0,1955.0,1954.0,1954.0,1953.0,1953.0,1953.0,1953.0,1951.0,1951.0,1951.0,1950.0,1950.0,1950.0,1949.0,1949.0,1948.0,1947.0,1947.0,1946.0,1946.0,1946.0,1944.0,1944.0,1944.0,1944.0,1944.0,1943.0,1941.0,1940.0,1940.0,1940.0,1939.0,1939.0,1938.0,1938.0,1937.0,1936.0,1933.0,1933.0,1933.0,1932.0,1932.0,1930.0,1930.0,1930.0,1929.0,1929.0,1929.0,1929.0,1928.0,1928.0,1928.0,1928.0,1928.0,1926.0,1926.0,1924.0,1924.0,1920.0,1920.0,1919.0,1919.0,1919.0,1918.0,1917.0,1917.0,1917.0,1917.0,1916.0,1915.0,1914.0,1914.0,1914.0,1913.0,1913.0,1913.0,1913.0,1912.0,1912.0,1911.0,1911.0,1910.0,1909.0,1909.0,1907.0,1907.0,1907.0,1906.0,1905.0,1905.0,1904.0,1903.0,1902.0,1902.0,1902.0,1902.0,1902.0,1901.0,1900.0,1900.0]},"kind":"numeric","n":200,"n_null":0,"n_unique":84,"null_rate":0.0,"stats":{"iqr":49.25,"kurtosis":-1.1688445737601993,"max":1999.0,"mean":1952.295,"median":1955.0,"min":1900.0,"n_outliers":0,"outlier_rate":0.0,"q1":1928.0,"q3":1977.25,"skew":-0.21342867893143286,"std":28.791364824235256,"zero_rate":0.0}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","country.top_value","country.top_rate","name.top_value","name.top_values","type.top_value","type.top_rate","vei.n_outliers","vei.max","vei.mean","year.min","year.max"],"featured_charts":[{"caption":"Look for Indonesia's outsized dominance over all other countries \u2014 it dwarfs even second-place Japan (29 records).","column":"country","kind":"bar"},{"caption":"Stratovolcanoes account for nearly 70% of records; check how thin the slices are for all other volcano types combined.","column":"type","kind":"donut"},{"caption":"Most eruptions cluster between VEI 2 and 3, but watch for the long right tail where 15 outliers reach up to VEI 6.","column":"vei","kind":"histogram"},{"caption":"Elevation spans from below sea level to over 5,000 m \u2014 look for the broad spread and any clustering around mid-range peaks.","column":"elevation","kind":"histogram"},{"caption":"Eruption records span the entire 20th century; check whether the distribution is roughly uniform or shows reporting gaps in early decades.","column":"year","kind":"histogram"}],"model":"anthropic:default","narrative":"This dataset captures 200 volcanic eruption records across 33 countries, covering events from 1900 to 1999, with 9 attributes including eruption intensity, volcano type, elevation, and geographic coordinates. The most striking feature is the heavy geographic concentration \u2014 Indonesia alone accounts for 28.5% of all records (57 out of 200), with Semeru appearing 13 times as the single most frequent volcano. Volcano type is strongly skewed toward stratovolcanoes, which make up 69.5% of all records, so the 'type' breakdown is worth examining to understand how rare other forms like calderas or shield volcanoes are by comparison. The Volcanic Explosivity Index (VEI) flags 15 outliers at the high end, with a maximum of 6.0 against a mean of 2.6, suggesting a small number of exceptionally powerful eruptions that deserve individual attention.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","median","q1","q3","iqr","n_outliers","outlier_rate","zero_rate"],"model":"anthropic:default","narrative":"This column is almost certainly the Volcanic Explosivity Index (VEI), a logarithmic scale rating volcanic eruption intensity. With only 7 unique integer values ranging from 0 to 6 and a median of 3, it behaves more like an ordinal category than a continuous numeric. Notably, 15 outliers (7.5% of rows) sit at the upper end of the scale \u2014 VEI 5\u20136 events are rare in real-world volcanology, so their presence is worth verifying. The IQR of 1.0 and tight Q1\u2013Q3 band of 2\u20133 confirm most eruptions cluster at moderate intensity.","role":"feature","scope":"column","target":"vei","treatment":"Treat as ordinal; consider one-hot or ordinal encoding rather than raw numeric use in models."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","n_unique","n","entropy_ratio","alerts","top_values"],"model":"anthropic:default","narrative":"This column contains volcano names, functioning as a label for individual volcanic entities in the dataset. With 111 unique values across 200 rows, many volcanoes appear multiple times \u2014 'Semeru' leads with 13 occurrences (6.5% of rows), suggesting repeated eruption or activity events per volcano rather than one row per volcano. The high entropy ratio of 0.946 combined with the long-tail alert indicates the distribution is broad but uneven, with a handful of well-known volcanoes (Semeru, Merapi, Etna, Stromboli) dominating while most names appear only once or twice.","role":"label","scope":"column","target":"name","treatment":"Group by this column to aggregate per-volcano statistics, or encode as a categorical feature with frequency-based or target encoding given the long-tail distribution."},{"confidence":"high","critiques":[],"evidence_keys":["stats.min","stats.max","stats.mean","stats.median","stats.iqr","stats.skew","stats.kurtosis","n_unique","n","null_rate"],"model":"anthropic:default","narrative":"This column represents geographic elevation in metres (or feet) for 200 location records, spanning from -185.0 (below sea level, consistent with places like the Dead Sea or Death Valley) to 5393.0 (alpine/high-altitude terrain). The distribution is broad and fairly flat \u2014 IQR of 1809.75 against a mean of 2074.21 \u2014 with a slight positive skew (0.39) and near-platykurtic shape (kurtosis -0.57), suggesting a deliberately diverse geographic sample rather than a natural population draw. With only 109 unique values across 200 rows, roughly 45% of values are repeated, which may indicate rounding to nearest metre or binned elevation bands.","role":"feature","scope":"column","target":"elevation","treatment":"Use as-is or apply mild normalisation (e.g. standard scaling); the negative minimum requires care if log-transforming \u2014 shift first."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","kurtosis","skew","n_unique","n","null_rate","n_outliers"],"model":"anthropic:default","narrative":"This column almost certainly records the year of a volcano's last known eruption, ranging from 1900 to 1999 with a mean of 1952.3 and median of 1955 \u2014 consistent with a dataset scoped to the 20th century. The distribution is notably platykurtic (kurtosis \u2248 \u22121.17), meaning eruption years are spread fairly uniformly across the century rather than clustering tightly around any single period. With only 84 unique values across 200 rows, many volcanoes share the same recorded eruption year, which is unsurprising given that annual granularity naturally produces ties. No nulls, no outliers, and near-zero skew make this a clean numeric feature.","role":"feature","scope":"column","target":"last_eruption","treatment":"Use as-is or engineer recency features (e.g., years since eruption relative to a reference year); no transformation needed given near-uniform distribution."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","n_unique","n","stats.skew","stats.kurtosis","stats.iqr","null_rate","outlier_rate","zero_rate"],"model":"anthropic:default","narrative":"This column contains geographic latitude values, spanning from -41.33\u00b0 (southern hemisphere, e.g., southern South America or New Zealand) to 63.983\u00b0 (northern hemisphere, e.g., Scandinavia or Canada), consistent with a globally distributed dataset. With only 111 unique values across 200 rows, many locations are repeated, suggesting the dataset references a limited set of geographic points rather than unique coordinates per record. The distribution is nearly symmetric (skew 0.20, kurtosis -0.48) and spans a wide IQR of 40.73\u00b0, indicating broad global coverage rather than clustering in one region. No nulls, outliers, or zeros are present.","role":"feature","scope":"column","target":"lat","treatment":"Pair with a longitude column for geospatial analysis; consider binning into regions or using as-is in spatial models."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","n_unique","n","null_rate"],"model":"anthropic:default","narrative":"This column is a geographic longitude coordinate, spanning the full valid range of \u2212175.65 to 177.18 degrees, indicating global coverage. Surprisingly, with only 111 unique values across 200 rows (~55% uniqueness), there is notable coordinate repetition, suggesting many records share the same location or coordinates have been rounded/binned. The mean (59.16) is substantially pulled away from the median (112.31) by a left skew (\u22120.86), implying a cluster of observations in Eastern hemisphere longitudes with a tail of negative (Western hemisphere) values dragging the mean down.","role":"feature","scope":"column","target":"lon","treatment":"Use as-is or pair with latitude for geospatial modelling; investigate duplicate coordinates (111 unique / 200 rows) to determine if binning or data quality issue."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","n_unique","n","null_rate","kurtosis","skew","q1","q3","iqr","median","mean"],"model":"anthropic:default","narrative":"This column represents a calendar year, spanning 1900 to 1999 \u2014 exactly one century of data with no nulls. With 84 unique values across 200 rows, some years appear multiple times, suggesting records grouped by year rather than unique annual entries. The distribution is notably flat (kurtosis \u2248 \u22121.17) and nearly symmetric (skew \u2248 \u22120.21), with the bulk of records concentrated between 1928 and 1977 (IQR = 49.25 years), which is surprisingly wide and uniform for a year field.","role":"feature","scope":"column","target":"year","treatment":"Use as an ordinal or numeric feature; consider binning into decades if cardinality reduction is needed."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","n_unique","null_rate","entropy_ratio","top_values","n"],"model":"anthropic:default","narrative":"This column records the country associated with each record \u2014 likely the location of a seismic, volcanic, or natural-disaster event given the top countries (Indonesia, Japan, Philippines, Papua New Guinea, Chile). Indonesia dominates heavily at 28.5% of all 200 rows (57 occurrences), followed by Japan at 14.5%, which is a pronounced geographic skew toward the Pacific Ring of Fire. With only 33 unique values and zero nulls, coverage is clean, but the top-heavy distribution (entropy ratio 0.78) means most records cluster around a handful of high-activity nations.","role":"label","scope":"column","target":"country","treatment":"One-hot encode or target-encode for modelling; be aware of class imbalance with Indonesia representing 28.5% of rows."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","cardinality","n","entropy_ratio","top_values","null_rate"],"model":"anthropic:default","narrative":"This column classifies volcanic structures into 13 morphological types, making it a geological label for each record. 'Stratovolcano' dominates heavily at 69.5% of 200 records (139 occurrences), while the remaining 12 types share the rest \u2014 an extreme concentration that yields an entropy ratio of only 0.47. The long tail of rare categories (e.g., 'Cinder cone' and 'Maar' each appearing \u22642 times) may cause class-imbalance problems in any supervised modelling task.","role":"label","scope":"column","target":"type","treatment":"One-hot encode or target-encode with caution due to severe class imbalance; consider grouping rare types (frequency < 3) into an 'Other' category before modelling."}],"providers":["anthropic:default"],"total_usage":{"completion_tokens":2990,"prompt_tokens":7792,"total_tokens":10782}},"language_counts":{},"meta":{"generated_at":"2026-06-22T00:26:41+00:00","mode":"full","row_count":200,"sampled_rows":200,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/volcanoes.json"},"notes":[],"saturn_version":"0.2.0","schema":{"country":"categorical","elevation":"numeric","last_eruption":"numeric","lat":"numeric","lon":"numeric","name":"categorical","type":"categorical","vei":"numeric","year":"numeric"}}
