{"columns":[{"alerts":[{"code":"long_tail","level":"info","message":"8 singleton categories"}],"column":"name","extras":{"singletons":8,"top_values":[["Mercury",1],["Venus",1],["Earth",1],["Mars",1],["Jupiter",1],["Saturn",1],["Uranus",1],["Neptune",1]]},"kind":"categorical","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"cardinality":8,"entropy":3.0,"entropy_ratio":1.0,"top_rate":0.125,"top_value":"Mercury"}},{"alerts":[],"column":"classification","extras":{"singletons":0,"top_values":[["Inner Planet",4],["Outer Planet",4]]},"kind":"categorical","n":8,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"Inner Planet"}},{"alerts":[],"column":"type","extras":{"singletons":0,"top_values":[["terrestrial",4],["gas_giant",2],["ice_giant",2]]},"kind":"categorical","n":8,"n_null":0,"n_unique":3,"null_rate":0.0,"stats":{"cardinality":3,"entropy":1.5,"entropy_ratio":0.9463946303571862,"top_rate":0.5,"top_value":"terrestrial"}},{"alerts":[],"column":"diameter_km","extras":{"histogram":{"counts":[4,2,0,0,2],"edges":[4879.0,32500.0,60121.0,87742.0,115363.0,142984.0]},"sample":[4879.0,12104.0,12756.0,6792.0,142984.0,120536.0,51118.0,49528.0]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":57696.5,"kurtosis":-0.8589363054601247,"max":142984.0,"mean":50087.125,"median":31142.0,"min":4879.0,"n_outliers":0,"outlier_rate":0.0,"q1":10776.0,"q3":68472.5,"skew":0.8486526956719965,"std":53916.366175342075,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"25.0% rows beyond 1.5 IQR"}],"column":"mass_earth","extras":{"histogram":{"counts":[6,1,0,0,1],"edges":[0.0553,63.604240000000004,127.15318,190.70211999999998,254.25106,317.8]},"sample":[0.0553,0.815,1.0,0.107,317.8,95.2,14.5,17.1]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":35.987,"kurtosis":2.1877326942222215,"max":317.8,"mean":55.822162500000005,"median":7.75,"min":0.0553,"n_outliers":2,"outlier_rate":0.25,"q1":0.6379999999999999,"q3":36.625,"skew":1.945258972853673,"std":110.60567546964742,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 IQR"}],"column":"semi_major_axis_au","extras":{"histogram":{"counts":[5,1,0,1,1],"edges":[0.38709927,6.323663968,12.260228666,18.196793364,24.133358062,30.06992276]},"sample":[0.38709927,0.72333566,1.00000261,1.52371034,5.202887,9.53667594,19.18916464,30.06992276]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":11.0189622425,"kurtosis":-0.10495450721924371,"max":30.06992276,"mean":8.4540997775,"median":3.36329867,"min":0.38709927,"n_outliers":1,"outlier_rate":0.125,"q1":0.9308358724999999,"q3":11.949798115,"skew":1.1471415647677028,"std":10.840814741729014,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 IQR"}],"column":"eccentricity","extras":{"histogram":{"counts":[3,3,1,0,1],"edges":[0.00677672,0.046548562,0.086320404,0.12609224600000002,0.16586408800000002,0.20563593]},"sample":[0.20563593,0.00677672,0.01671123,0.0933941,0.04838624,0.05386179,0.04725744,0.00859048]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":0.049063825,"kurtosis":1.164689721149288,"max":0.20563593,"mean":0.060076741249999996,"median":0.04782184,"min":0.00677672,"n_outliers":1,"outlier_rate":0.125,"q1":0.0146810425,"q3":0.0637448675,"skew":1.4949078874770414,"std":0.06547567342741696,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 IQR"}],"column":"inclination_deg","extras":{"histogram":{"counts":[3,3,1,0,1],"edges":[1.531e-05,1.4010080520000001,2.8020007940000005,4.202993536000001,5.603986278000001,7.00497902]},"sample":[7.00497902,3.39467605,1.531e-05,1.84969142,1.30439695,2.48599187,0.77263783,1.77004347]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":1.5417057449999998,"kurtosis":0.9324541934645634,"max":7.00497902,"mean":2.32280399,"median":1.809867445,"min":1.531e-05,"n_outliers":1,"outlier_rate":0.125,"q1":1.17145717,"q3":2.713162915,"skew":1.319584025594446,"std":2.1535086977758136,"zero_rate":0.0}},{"alerts":[],"column":"ascending_node_deg","extras":{"histogram":{"counts":[1,2,2,1,2],"edges":[0.0,26.356845148,52.713690296,79.070535444,105.427380592,131.78422574]},"sample":[48.33076593,76.67984255,0.0,49.55953891,100.47390909,113.66242448,74.01692503,131.78422574]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":54.51869227250001,"kurtosis":-0.6348658975948283,"max":131.78422574,"mean":74.31345396625,"median":75.34838379,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":49.252345665,"q3":103.77103793750001,"skew":-0.35942676881674585,"std":42.00617990925109,"zero_rate":0.125}},{"alerts":[],"column":"argument_perihelion_deg","extras":{"histogram":{"counts":[2,2,0,2,2],"edges":[29.12703035,91.179953748,153.23287714600002,215.28580054399998,277.338723942,339.39164734]},"sample":[29.12703035,54.89223617,102.93768193,286.50207128,273.86774079,339.39164734,96.99854424,272.84981044]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":190.55435619000002,"kurtosis":-1.7245338654557145,"max":339.39164734,"mean":182.07084531750002,"median":187.893746185,"min":29.12703035,"n_outliers":0,"outlier_rate":0.0,"q1":86.4719672225,"q3":277.0263234125,"skew":-0.015846923225698993,"std":122.7010125420869,"zero_rate":0.0}},{"alerts":[],"column":"mean_anomaly_deg","extras":{"histogram":{"counts":[3,1,2,1,1],"edges":[19.38696678,78.913650982,138.440335184,197.96701938599998,257.49370358799996,317.02038779]},"sample":[174.79252722,50.11527928,100.46457166,19.38696678,20.02082574,317.02038779,142.28381088,256.22833004]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":152.55981203,"kurtosis":-1.067975364912057,"max":317.02038779,"mean":135.03908742375,"median":121.37419127000001,"min":19.38696678,"n_outliers":0,"outlier_rate":0.0,"q1":42.591665895000006,"q3":195.151477925,"skew":0.4780136853031362,"std":109.83683487178708,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 IQR"}],"column":"orbital_period_years","extras":{"histogram":{"counts":[6,0,1,0,1],"edges":[0.2408467,33.150941360000004,66.06103602000002,98.97113068000003,131.88122534000001,164.79132]},"sample":[0.2408467,0.61519726,1.0000174,1.8808476,11.862615,29.447498,84.016846,164.79132]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":42.186022635,"kurtosis":0.7640082670484123,"max":164.79132,"mean":36.731898495,"median":6.8717313,"min":0.2408467,"n_outliers":1,"outlier_rate":0.125,"q1":0.903812365,"q3":43.089835,"skew":1.4858168500439484,"std":59.081059925143556,"zero_rate":0.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-2.02"},{"code":"outliers","level":"warn","message":"25.0% rows beyond 1.5 IQR"}],"column":"rotation_period_days","extras":{"histogram":{"counts":[1,0,0,0,7],"edges":[-243.025,-182.69080000000002,-122.35660000000001,-62.02240000000003,-1.6882000000000232,58.646]},"sample":[58.646,-243.025,0.99726968,1.025957,0.41354,0.44401,-0.71833,0.67125]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":0.87386901,"kurtosis":2.6378894254659064,"max":58.646,"mean":-22.693162915000002,"median":0.5576300000000001,"min":-243.025,"n_outliers":2,"outlier_rate":0.25,"q1":0.13057249999999998,"q3":1.00444151,"skew":-2.0216681687953524,"std":91.32676705548657,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 IQR"}],"column":"perihelion_distance_au","extras":{"histogram":{"counts":[5,1,0,1,1],"edges":[0.30749951,6.2082708019999995,12.109042094,18.009813385999998,23.910584678,29.81135597]},"sample":[0.30749951,0.7184327,0.98329134,1.38133346,4.95155843,9.02063224,18.28254178,29.81135597]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":10.419032945,"kurtosis":0.03886125285406061,"max":29.81135597,"mean":8.18208067875,"median":3.1664459450000004,"min":0.30749951,"n_outliers":1,"outlier_rate":0.125,"q1":0.91707668,"q3":11.336109624999999,"skew":1.1977900561348072,"std":10.668860611371056,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 IQR"}],"column":"aphelion_distance_au","extras":{"histogram":{"counts":[5,1,0,1,1],"edges":[0.46669903,6.439057134,12.411415238,18.383773341999998,24.356131446,30.32848955]},"sample":[0.46669903,0.72823862,1.01671388,1.66608722,5.45421557,10.05271964,20.0957875,30.32848955]},"kind":"numeric","n":8,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":11.61889154,"kurtosis":-0.2379626621635489,"max":30.32848955,"mean":8.72611887625,"median":3.560151395,"min":0.46669903,"n_outliers":1,"outlier_rate":0.125,"q1":0.9445950649999999,"q3":12.563486605,"skew":1.09972025092023,"std":11.018556305129799,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"87.5% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"has_rings","extras":{"singletons":1,"top_values":[["True",1]]},"kind":"categorical","n":8,"n_null":7,"n_unique":1,"null_rate":0.875,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"True"}},{"alerts":[{"code":"null_rate","level":"warn","message":"87.5% null"},{"code":"constant","level":"info","message":"only one distinct value"}],"column":"ring_inner_radius_km","extras":{"histogram":{"counts":[0,0,1,0,0],"edges":[74499.5,74499.7,74499.9,74500.1,74500.3,74500.5]},"sample":[74500.0]},"kind":"numeric","n":8,"n_null":7,"n_unique":1,"null_rate":0.875,"stats":{"iqr":0.0,"kurtosis":0.0,"max":74500.0,"mean":74500.0,"median":74500.0,"min":74500.0,"n_outliers":0,"outlier_rate":0.0,"q1":74500.0,"q3":74500.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"87.5% null"},{"code":"constant","level":"info","message":"only one distinct value"}],"column":"ring_outer_radius_km","extras":{"histogram":{"counts":[0,0,1,0,0],"edges":[140219.5,140219.7,140219.9,140220.1,140220.3,140220.5]},"sample":[140220.0]},"kind":"numeric","n":8,"n_null":7,"n_unique":1,"null_rate":0.875,"stats":{"iqr":0.0,"kurtosis":0.0,"max":140220.0,"mean":140220.0,"median":140220.0,"min":140220.0,"n_outliers":0,"outlier_rate":0.0,"q1":140220.0,"q3":140220.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"data_source","extras":{"singletons":0,"top_values":[["NASA JPL Horizons",8]]},"kind":"categorical","n":8,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"NASA JPL Horizons"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"fetch_date","extras":{"singletons":0,"top_values":[["2026-01-19",8]]},"kind":"categorical","n":8,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"2026-01-19"}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["mass_earth.stats.max","mass_earth.stats.min","mass_earth.stats.median","mass_earth.n_outliers","mass_earth.outlier_rate","rotation_period_days.stats.mean","rotation_period_days.stats.min","rotation_period_days.n_outliers","has_rings.null_rate","classification.top_values","type.top_values","orbital_period_years.stats.max","orbital_period_years.stats.min","diameter_km.stats.max","diameter_km.stats.min"],"featured_charts":[{"caption":"Look for the extreme right tail \u2014 one or two gas giants dwarf all terrestrial planets by orders of magnitude.","column":"mass_earth","kind":"bar"},{"caption":"Shows the 50/25/25 split between terrestrial planets, gas giants, and ice giants.","column":"type","kind":"donut"},{"caption":"Neptune's 164-year orbit creates a sharp outlier against the tightly clustered inner planets.","column":"orbital_period_years","kind":"bar"},{"caption":"Negative values flag retrograde rotators \u2014 watch for Venus's extreme slow reverse spin at -243 days.","column":"rotation_period_days","kind":"histogram"},{"caption":"Diameter spans from 4,879 km (Mercury) to 142,984 km (Jupiter), revealing the size gulf between planet classes.","column":"diameter_km","kind":"bar"}],"model":"anthropic:default","narrative":"This dataset contains orbital and physical characteristics of all 8 planets in the Solar System, sourced from NASA JPL Horizons on 2026-01-19. The most striking feature is the extreme spread in planetary mass: values range from 0.0553 to 317.8 Earth masses, with 2 outliers (25% outlier rate) pulling the mean far above the median of 7.75 \u2014 a clear sign that Jupiter and Saturn dominate. Rotation period is equally dramatic, with a mean of -22.7 days and a minimum of -243.025 days, reflecting both retrograde rotation (Venus) and the very slow spin of some planets \u2014 worth examining closely. The dataset splits cleanly into 4 Inner Planets and 4 Outer Planets, and ring data (has_rings, ring radii) is only populated for 1 planet (87.5% null rate), consistent with Saturn being the sole ringed entry recorded.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","cardinality","entropy","top_value","top_rate"],"model":"anthropic:default","narrative":"This column indicates whether a celestial body has rings, but with only 8 rows total and a null rate of 87.5%, just 1 non-null value exists \u2014 and that single value is 'True'. The column has cardinality of 1 and entropy of 0.0, meaning it carries zero discriminative information in its current state. The combination of near-total missingness and complete class imbalance makes this column analytically useless as-is.","role":"feature","scope":"column","target":"has_rings","treatment":"Drop or impute with domain knowledge before modelling; currently provides no signal due to 87.5% null rate and single observed value."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","std","outlier_rate","n_outliers","n","n_unique","null_rate"],"model":"anthropic:default","narrative":"This column records the rotational period of planetary or solar-system bodies in days. The most striking feature is a negative mean (-22.69) and a minimum of -243.025, which in planetary science convention indicates retrograde rotation (Venus = -243 days, Uranus \u2248 -0.718 days); these negatives are domain-valid but will surprise analysts expecting strictly positive durations. With only 8 rows, all unique, and an outlier rate of 25% (2 of 8 values), the distribution is heavily dominated by the extreme retrograde values, producing a skew of -2.02 and std of 91.33 against a median of just 0.558 days.","role":"feature","scope":"column","target":"rotation_period_days","treatment":"Do not treat negatives as errors; preserve sign to encode rotation direction, but consider splitting into |rotation_period_days| and a binary retrograde flag, then log-transform the absolute value before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","n","stats.mean","stats.std","stats.min","stats.max"],"model":"anthropic:default","narrative":"This column records the inner radius (in kilometres) of a planetary ring system. It is nearly useless in its current state: 87.5% of rows are null, and the single non-null value is constant at 74,500.0 km across all 8 rows (n_unique = 1, std = 0.0). With no variance and overwhelming missingness, the column carries no discriminative signal for modelling.","role":"feature","scope":"column","target":"ring_inner_radius_km","treatment":"Drop from modelling due to 87.5% null rate and zero variance; retain only if the single value (74500.0 km) has domain significance worth documenting as metadata."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.std","stats.mean","stats.max","stats.min","n"],"model":"anthropic:default","narrative":"This column records the outer radius (in km) of a planetary ring system. It is nearly entirely empty \u2014 87.5% null rate across only 8 rows \u2014 and the single non-null value (140,220 km) is constant across all observed cases, giving zero variance. With n_unique=1 and std=0.0, this column carries no discriminative information in the current dataset.","role":"feature","scope":"column","target":"ring_outer_radius_km","treatment":"Drop from modelling; if the dataset grows to include multiple ring systems, revisit as a numeric feature."},{"confidence":"high","critiques":[],"evidence_keys":["mean","median","max","min","skew","iqr","std","n","n_unique","n_outliers","outlier_rate"],"model":"anthropic:default","narrative":"This column records the aphelion distance (farthest orbital point from the Sun) in astronomical units for 8 solar system bodies. The mean of 8.73 AU is heavily pulled above the median of 3.56 AU by a right-skewed distribution (skew 1.10), with one flagged outlier likely representing a distant outer-planet or dwarf-planet body near the maximum of 30.33 AU (plausibly Neptune or a trans-Neptunian object). With only 8 rows and all values unique, this is a tiny reference dataset; the IQR of 11.62 and std of 11.02 underscore the enormous orbital spread across the sample.","role":"feature","scope":"column","target":"aphelion_distance_au","treatment":"With n=8, use as-is for descriptive or rule-based work; consider log-transform to reduce skew if used in any distance-based or regression model."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","n","n_unique","n_outliers","outlier_rate","null_rate"],"model":"anthropic:default","narrative":"This column represents orbital eccentricity values, likely for planets or moons in a solar system dataset (n=8 strongly suggests the eight planets). Values range from 0.00677672 to 0.20563593, consistent with known planetary eccentricities (e.g., Mercury ~0.206, nearly circular orbits near 0). The distribution is right-skewed (skew=1.49) with one flagged outlier (outlier_rate=0.125, i.e., 1 of 8 rows), almost certainly the high-eccentricity body at max=0.20563593 \u2014 a physically meaningful extreme rather than a data error.","role":"feature","scope":"column","target":"eccentricity","treatment":"Use as-is for orbital mechanics modelling; the outlier is physically valid and should not be winsorized."},{"confidence":"high","critiques":[],"evidence_keys":["mean","median","max","min","iqr","skew","n","n_unique","n_outliers","outlier_rate","null_rate"],"model":"anthropic:default","narrative":"This column records orbital inclination in degrees, likely for a small set of 8 celestial bodies (satellites, asteroids, or planets). The values cluster tightly between ~1.2\u00b0 and ~2.7\u00b0 (IQR), but the maximum of 7.00\u00b0 is flagged as an outlier and pulls the mean (2.32\u00b0) well above the median (1.81\u00b0), producing notable right skew (1.32). With only 8 rows, each a unique value and no nulls, this is a clean but extremely small sample where a single high-inclination object (\u22487\u00b0) dominates distributional shape.","role":"feature","scope":"column","target":"inclination_deg","treatment":"Use as-is or apply mild log-transform to reduce right skew before regression; flag the single outlier (max=7.00\u00b0) for domain review given the tiny sample."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.min","stats.max","stats.median","stats.mean","stats.skew","stats.kurtosis","stats.iqr","stats.std","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:default","narrative":"This column represents planetary mass expressed in Earth masses, almost certainly a small solar-system body catalogue (n=8 matches the eight classical planets). The distribution is extremely right-skewed (skew=1.95, kurtosis=2.19): the median is only 7.75 M\u2295 while the mean is 55.82 M\u2295, driven by the two flagged outliers that reach up to 317.8 M\u2295 (consistent with Jupiter). The IQR of 35.99 versus a std of 110.61 confirms the heavy upper tail.","role":"feature","scope":"column","target":"mass_earth","treatment":"log-transform before regression or distance-based modelling to compress the heavy right tail."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","std","iqr","n_outliers","outlier_rate","n","n_unique"],"model":"anthropic:default","narrative":"This column holds orbital period measurements in years for what appears to be a small set of 8 planetary or solar-system bodies \u2014 values spanning 0.2408467 years (roughly 88 days, consistent with Mercury) up to 164.79132 years (consistent with Neptune). The distribution is strongly right-skewed (skew = 1.49) with a mean of 36.73 years pulled well above the median of 6.87 years, and 1 outlier (12.5% of rows) at the high end \u2014 almost certainly the Neptune-like body at 164.79 years. The IQR of 42.19 and std of 59.08 both confirm the wide spread driven by that extreme upper value.","role":"feature","scope":"column","target":"orbital_period_years","treatment":"Log-transform before regression or distance-based modelling to compress the heavy right tail."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","std","skew","n_outliers","outlier_rate","n","n_unique"],"model":"anthropic:default","narrative":"This column records perihelion distance in astronomical units (AU) \u2014 the closest orbital approach to the Sun \u2014 for 8 distinct solar system objects. With only 8 rows, the sample is tiny, yet the spread is extreme: values range from 0.31 AU (a Sun-grazing or inner-solar-system body) to 29.81 AU (near Neptune's orbit), and the standard deviation of 10.67 AU nearly equals the mean of 8.18 AU. One outlier is flagged (outlier_rate = 0.125, i.e., 1 of 8 rows), almost certainly the 29.81 AU value, which pulls the mean far above the median of 3.17 AU and drives a skew of 1.20.","role":"feature","scope":"column","target":"perihelion_distance_au","treatment":"Log-transform before modelling to reduce right skew; flag the 29.81 AU record for domain review as a potential distant trans-Neptunian object."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","n","n_unique","n_outliers","outlier_rate","null_rate"],"model":"anthropic:default","narrative":"This column contains the semi-major axis (in astronomical units) for what appears to be the 8 classical planets of our solar system, given the min of ~0.387 AU (Mercury) and max of ~30.07 AU (Neptune). The distribution is right-skewed (skew = 1.15) with the mean (8.45 AU) pulled well above the median (3.36 AU), and 1 outlier (Neptune at 30.07 AU) is flagged \u2014 unsurprising given the exponential spacing of outer planets. With only 8 rows and 8 unique values, this is essentially a lookup table with no nulls or duplicates.","role":"feature","scope":"column","target":"semi_major_axis_au","treatment":"Log-transform before regression to compress the wide outer-planet range."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","cardinality","top_rate","top_value","null_rate","entropy"],"model":"anthropic:default","narrative":"This column records the data source for each row, and every single one of the 8 records carries the identical value 'NASA JPL Horizons' (top_rate = 1.0, cardinality = 1). With zero variance and zero nulls, the column carries no discriminative information whatsoever. The imbalance alert is technically correct but understates the situation \u2014 this is a fully constant column.","role":"metadata","scope":"column","target":"data_source","treatment":"Drop before modelling; if data provenance tracking is needed, retain as a dataset-level annotation rather than a per-row column."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","top_value","top_rate","entropy","cardinality"],"model":"anthropic:default","narrative":"This column is a data-fetch or extraction timestamp recording when the dataset was retrieved. Every single one of the 8 rows carries the identical value '2026-01-19', giving it zero entropy and cardinality of 1. This makes it a constant column with no discriminative power \u2014 the 'imbalance' alert fires because top_rate is 1.0. It likely reflects a single snapshot pull rather than a longitudinal series.","role":"metadata","scope":"column","target":"fetch_date","treatment":"Drop before modelling; constant column adds no signal and wastes a feature slot."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","cardinality","entropy_ratio","null_rate","top_values"],"model":"anthropic:default","narrative":"This column contains the names of the eight planets in our solar system, each appearing exactly once (cardinality 8, n 8, null_rate 0.0). The entropy_ratio of 1.0 confirms perfectly uniform distribution \u2014 every value is unique \u2014 making this a natural row identifier rather than a grouping label. The 'long_tail' alert is a statistical artefact of the perfect uniformity, not a genuine distributional concern.","role":"identifier","scope":"column","target":"name","treatment":"Use as a row label or index key; do not one-hot encode or use as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["column","min","max","mean","median","iqr","skew","kurtosis","n","n_unique","null_rate"],"model":"anthropic:default","narrative":"This column represents the argument of perihelion in degrees, an orbital mechanics parameter defining the angle between an orbit's ascending node and its closest approach point to the central body. With only 8 rows, all unique, values span nearly the full 0\u2013360\u00b0 angular range (min 29.13\u00b0, max 339.39\u00b0), which is physically expected for a diverse set of orbiting bodies. The distribution is remarkably symmetric (skew \u2248 \u20130.016) with a near-flat shape (kurtosis \u20131.72), consistent with a quasi-uniform spread across the angular domain \u2014 no clustering or preferred orientation is evident. The wide IQR of 190.55\u00b0 relative to the 310.26\u00b0 total range confirms this near-uniform spread.","role":"feature","scope":"column","target":"argument_perihelion_deg","treatment":"Use as-is or encode as sine/cosine pair (sin/cos of radians) to preserve angular periodicity before modelling."},{"confidence":"medium","critiques":[],"evidence_keys":["column","n","n_unique","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.kurtosis","stats.zero_rate","null_rate"],"model":"anthropic:default","narrative":"This column represents the longitude (or argument) of the ascending node in degrees, an orbital mechanics parameter defining where an orbit crosses a reference plane. With only 8 rows, all unique and no nulls, this is a very small dataset \u2014 likely a catalogue of 8 distinct celestial bodies or orbital elements. The minimum value is exactly 0.0 (zero_rate 0.125, i.e. one record), which could be a reference orbit or a true zero-node case, but the distribution is otherwise fairly uniform across 0\u2013131.8\u00b0 with mild negative skew (-0.36) and slightly platykurtic shape (-0.63), consistent with a small, spread-out sample rather than any clustering.","role":"feature","scope":"column","target":"ascending_node_deg","treatment":"Use as-is in orbital mechanics modelling; consider sine/cosine encoding if used in a circular-aware ML pipeline, since degrees are periodic over 360\u00b0."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","min","max","mean","median","skew","kurtosis","null_rate"],"model":"anthropic:default","narrative":"This column represents the diameter in kilometres of solar system planets \u2014 the 8 unique values across n=8 rows (no nulls, no duplicates) align perfectly with the eight recognised planets. The range spans 4,879 km (Mercury) to 142,984 km (Jupiter), with a mean of 50,087 km and a median of 31,142 km, reflecting moderate right skew (0.85) driven by the gas giants pulling the distribution upward. Despite the skew, kurtosis is slightly negative (\u22120.86), indicating a flat, spread-out distribution rather than a peaked one \u2014 expected given the vast size differences across planetary classes.","role":"feature","scope":"column","target":"diameter_km","treatment":"Log-transform before regression or distance-based modelling to compress the wide range between terrestrial and gas giant values."},{"confidence":"high","critiques":[],"evidence_keys":["column","n","n_unique","stats.min","stats.max","stats.iqr","stats.std","stats.kurtosis","stats.skew","null_rate"],"model":"anthropic:default","narrative":"This column represents the mean anomaly in degrees, an orbital mechanics parameter describing the fraction of an orbital period elapsed since periapsis, typically ranging 0\u2013360\u00b0. With only 8 rows (all unique, no nulls), this appears to be a very small dataset of celestial objects or orbital elements. Values span 19.39\u00b0 to 317.02\u00b0 with a large IQR of 152.56\u00b0 and std of 109.84\u00b0, indicating wide, near-uniform spread across the angular range \u2014 consistent with the platykurtic kurtosis of \u22121.07 and mild positive skew of 0.48.","role":"feature","scope":"column","target":"mean_anomaly_deg","treatment":"Use as-is or convert to sine/cosine pair to preserve circular periodicity before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","cardinality","top_value","top_rate","entropy_ratio","top_values","null_rate"],"model":"anthropic:default","narrative":"This column classifies planets into two categories \u2014 'Inner Planet' and 'Outer Planet' \u2014 consistent with standard solar system taxonomy. The distribution is perfectly balanced, with exactly 4 instances of each class across only 8 total rows, yielding a maximum entropy_ratio of 1.0. The tiny dataset size (n=8) matches the 8 classical planets, suggesting this is a complete, exhaustive planetary dataset rather than a sample. The perfect 50/50 split is notable but expected given the known 4-inner / 4-outer planet structure of the solar system.","role":"label","scope":"column","target":"classification","treatment":"Use as a binary classification target or grouping variable; encode as 0/1 for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","cardinality","top_value","top_rate","top_values","null_rate"],"model":"anthropic:default","narrative":"This column classifies planetary bodies into three physical types: terrestrial, gas_giant, and ice_giant \u2014 almost certainly a planet-type taxonomy from a solar system dataset. With only 8 rows and 3 categories, the dataset is tiny. 'terrestrial' dominates at 50% (4 of 8), while gas_giant and ice_giant each appear exactly twice, which mirrors the actual composition of our solar system's 8 planets.","role":"label","scope":"column","target":"type","treatment":"One-hot encode for modelling; with only 3 categories and 8 rows, verify dataset is not a toy/sample before drawing conclusions."}],"providers":["anthropic:default"],"total_usage":{"completion_tokens":5613,"prompt_tokens":15904,"total_tokens":21517}},"language_counts":{},"meta":{"generated_at":"2026-06-22T00:27:51+00:00","mode":"full","row_count":8,"sampled_rows":8,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/planets.json"},"notes":[],"saturn_version":"0.2.0","schema":{"aphelion_distance_au":"numeric","argument_perihelion_deg":"numeric","ascending_node_deg":"numeric","classification":"categorical","data_source":"categorical","diameter_km":"numeric","eccentricity":"numeric","fetch_date":"categorical","has_rings":"boolean","inclination_deg":"numeric","mass_earth":"numeric","mean_anomaly_deg":"numeric","name":"categorical","orbital_period_years":"numeric","perihelion_distance_au":"numeric","ring_inner_radius_km":"numeric","ring_outer_radius_km":"numeric","rotation_period_days":"numeric","semi_major_axis_au":"numeric","type":"categorical"}}
