{"columns":[{"alerts":[],"column":"id","extras":{"histogram":{"counts":[682,889,623,736,297,352,305,2679,300,756,951,705,532,318,386,200,207,261,161,175,250,270,89,115,734,391,155,137,204,137,94,180,175,157,133,114,132,97,255,130],"edges":[24151805.0,361981016.9,699810228.8,1037639440.6999999,1375468652.6,1713297864.5,2051127076.3999999,2388956288.2999997,2726785500.2,3064614712.1,3402443924.0,3740273135.8999996,4078102347.7999997,4415931559.7,4753760771.599999,5091589983.5,5429419195.4,5767248407.299999,6105077619.2,6442906831.099999,6780736043.0,7118565254.9,7456394466.799999,7794223678.7,8132052890.599999,8469882102.499999,8807711314.4,9145540526.3,9483369738.199999,9821198950.099998,10159028162.0,10496857373.9,10834686585.8,11172515797.699999,11510345009.599998,11848174221.5,12186003433.4,12523832645.3,12861661857.199999,13199491069.099998,13537320281.0]},"sample":[303571498.0,317394023.0,347499962.0,375900720.0,405150976.0,429926821.0,430106185.0,447704400.0,472405793.0,474405979.0,485354347.0,486566327.0,527264097.0,538057764.0,621430174.0,656666664.0,734660697.0,813556934.0,840184351.0,947055346.0,956324598.0,956324873.0,1315977884.0,1506449074.0,1506449094.0,1545798216.0,1643395934.0,1818526205.0,1837848019.0,1842623743.0,1843049605.0,1882306295.0,1900067168.0,1906500637.0,1944497009.0,1967705198.0,1997398744.0,1997398758.0,2000639302.0,2016409992.0,2049084163.0,2049750022.0,2086249073.0,2092617401.0,2108952383.0,2146264297.0,2172384281.0,2189380043.0,2268643742.0,2282245624.0,2284773289.0,2291161878.0,2407322595.0,2407322612.0,2407322654.0,2407322676.0,2425260668.0,2431661415.0,2440549725.0,2468495679.0,2468495690.0,2468495804.0,2468495856.0,2468495903.0,2468495915.0,2468496050.0,2469448819.0,2469448890.0,2469448914.0,2469448920.0,2469448940.0,2469448946.0,2469449002.0,2469449101.0,2469449174.0,2469449373.0,2469449410.0,2469449431.0,2469449486.0,2469449623.0,2469449827.0,2469449901.0,2469449921.0,2469956957.0,2469956958.0,2469957008.0,2469957017.0,246995702
3.0,2469957103.0,2469957135.0,2469957212.0,2469957242.0,2469957252.0,2469957273.0,2469957301.0,2469957305.0,2469981406.0,2469981622.0,2469996118.0,2470148215.0,2470148271.0,2470148282.0,2470148376.0,2470148382.0,2470148398.0,2470148437.0,2470315441.0,2470315771.0,2470315961.0,2470315993.0,2470315994.0,2470316000.0,2470316015.0,2470383159.0,2470383163.0,2470383273.0,2470383333.0,2470383374.0,2470383387.0,2470383458.0,2470383472.0,2470383580.0,2470409479.0,2470409503.0,2470409549.0,2470409628.0,2470409634.0,2470409834.0,2504386099.0,2523420535.0,2539779873.0,2560653666.0,2560843481.0,2560861626.0,2582734913.0,2614117246.0,2625665820.0,2628687053.0,2628998957.0,2640136772.0,2712656918.0,2791754600.0,2844219483.0,2844219673.0,2863922004.0,2898067975.0,2906437710.0,2928142500.0,2943576692.0,2943835900.0,3003268254.0,3006138595.0,3018513731.0,3029059233.0,3034495533.0,3065601780.0,3117266935.0,3155205969.0,3165463761.0,3170159361.0,3188072247.0,3203787845.0,3259085925.0,3324271420.0,3331953091.0,3332497653.0,3332942846.0,3334352184.0,3334436818.0,3349576571.0,3370627767.0,3372347214.0,3377769896.0,3402688570.0,3404937512.0,3406947932.0,3407566220.0,3412454612.0,3412454622.0,3414873416.0,3414873421.0,3421082200.0,3421082209.0,3423854445.0,3423854468.0,3423854474.0,3437133102.0,3473932398.0,3475111274.0,3494809762.0,3497727603.0,3504849509.0,3510039161.0,3595930810.0,3596929097.0,3607742815.0,3624001463.0,3648342932.0,3681396261.0,3704238760.0,3726791221.0,3818688161.0,3931466339.0,3954296778.0,3978534989.0,3980596284.0,3994147236.0,3994147243.0,3994189708.0,3994189709.0,3994189711.0,3994189713.0,3994189742.0,3994190665.0,3994190713.0,3994226680.0,3994226711.0,3994226712.0,3994226751.0,3994227460.0,3999273889.0,4002129011.0,4004975964.0,4004998422.0,4006047814.0,4006470889.0,4013145586.0,4045352308.0,4077791998.0,4077843705.0,4077876798.0,4078026332.0,4078026337.0,4078118805.0,4080961838.0,4080961846.0,4080961881.0,4080961882.0,4080962095.0,4111597197.0,4111597804.0,4142604
490.0,4178225167.0,4235391727.0,4298334828.0,4298472638.0,4298701819.0,4298735126.0,4306892167.0,4329850133.0,4350915587.0,4365477361.0,4367050158.0,4398015290.0,4436523743.0,4465410682.0,4549942567.0,4553351706.0,4559723157.0,4579378981.0,4595246891.0,4599901910.0,4656921386.0,4683280940.0,4705591771.0,4818198111.0,4875713308.0,4942010360.0,4973205762.0,4976702728.0,5056454313.0,5157876060.0,5179641604.0,5179710829.0,5251146253.0,5339167741.0,5339387690.0,5351785120.0,5420994442.0,5465028248.0,5609912223.0,5609912224.0,5613863073.0,5622327928.0,5701609814.0,5742270500.0,5859222459.0,5859222472.0,5859222478.0,5891332933.0,5945488638.0,5971438525.0,5997815086.0,6026222509.0,6126932928.0,6132822802.0,6287095838.0,6564922640.0,6598765746.0,6636682165.0,6791509463.0,6943571705.0,6969196247.0,7025928018.0,7036587784.0,7072207567.0,7172923202.0,7230037387.0,7234300185.0,7234302685.0,7234321986.0,7471687559.0,7660400546.0,7676209059.0,7740330309.0,7846534433.0,7862154325.0,7943103641.0,7947745297.0,8176909545.0,8212693218.0,8237961249.0,8242887914.0,8275494594.0,8283800981.0,8284019543.0,8284305311.0,8285934278.0,8326017489.0,8356910091.0,8356910094.0,8412103752.0,8412115024.0,8415441810.0,8420978104.0,8423083411.0,8430696886.0,8438977587.0,8439915034.0,8445587915.0,8449085106.0,8452017276.0,8453240523.0,8456382909.0,8460139752.0,8481837786.0,8484833289.0,8484848211.0,8504728389.0,8507517201.0,8509090169.0,8514901788.0,8516396231.0,8521998031.0,8529188814.0,8530683612.0,8530791942.0,8582209419.0,8592577516.0,8850442330.0,8851345678.0,8891154307.0,8911215813.0,8935980115.0,8997876818.0,9157946836.0,9373742487.0,9404088689.0,9421469375.0,9581631334.0,9583430185.0,9617086359.0,9682921017.0,9706030301.0,9727457360.0,9782058412.0,9851543057.0,9873165430.0,9909911127.0,9913004745.0,9913004747.0,10051040956.0,10082969289.0,10239822580.0,10266185152.0,10309405911.0,10579303201.0,10581404385.0,10589075284.0,10589075316.0,10608625582.0,10608625583.0,10658487759.0,10727792433.0,10731
025880.0,10737002808.0,10775879853.0,10777394187.0,10903409927.0,10921116068.0,11038172332.0,11076127884.0,11094341472.0,11096507729.0,11238605970.0,11333186341.0,11353494455.0,11425927039.0,11444278761.0,11514332612.0,11646935872.0,11647011904.0,11738674352.0,11871248494.0,11989516928.0,12167730056.0,12188456258.0,12292218722.0,12311639568.0,12393359740.0,12393359741.0,12459039956.0,12829036477.0,12865158021.0,12866471545.0,12866484503.0,12866484508.0,12999781951.0,13011944460.0,13063886614.0,13090618908.0,13197867541.0,13319663284.0,13369286237.0,83889115.0,174713139.0,178679962.0,189547431.0,201487153.0,241020548.0,266656347.0,266667794.0,305371142.0,312396995.0,314891717.0,321331724.0,370452347.0,370452349.0,370460523.0,372012651.0,375486211.0,375488010.0,377360897.0,390207429.0,405650383.0,456202924.0,460285327.0,460345819.0,498850106.0,504873532.0,534410698.0,538353502.0,541508807.0,587874956.0,619186237.0,647535176.0,670560732.0,759536204.0,759536210.0,767335437.0,768601925.0,795027640.0,891689827.0,901745746.0,915580051.0,960907460.0,978430366.0,978430377.0,978430384.0,978430413.0,1017806301.0,1044488814.0,1083776237.0,1125397109.0,1130935890.0,1130939166.0,1137373140.0,1137845772.0,1138151187.0,1145086685.0,1204032676.0,1232042586.0,1239192285.0,1244773806.0,1252970907.0,1253430473.0,1284606543.0,1414951043.0,1414953927.0,1415213018.0]},"kind":"numeric","n":15464,"n_null":0,"n_unique":15464,"null_rate":0.0,"stats":{"iqr":4470637943.25,"kurtosis":-0.20064733809425084,"max":13537320281.0,"mean":4503184709.8944,"median":3411205875.5,"min":24151805.0,"n_outliers":0,"outlier_rate":0.0,"q1":2374723033.5,"q3":6845360976.75,"skew":0.890734864386113,"std":3470459882.4900117,"zero_rate":0.0}},{"alerts":[],"column":"osm_type","extras":{"singletons":0,"top_values":[["node",13311],["way",2153]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.5822097333793447,"entropy_ratio":0.5822097333793447,"top_rate":0.8607
734092084842,"top_value":"node"}},{"alerts":[{"code":"one_word","level":"warn","message":"37.8% rows are a single word"},{"code":"duplicates","level":"warn","message":"36.2% duplicate strings"}],"column":"name","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[4725,27,252,552,420,493,810,1037,1247,1295,1726,831,680,447,283,185,134,86,83,37,43,15,13,13,4,9,4,1,5,2,2,1,0,1,0,0,0,0,0,1],"edges":[0.0,2.1,4.2,6.300000000000001,8.4,10.5,12.600000000000001,14.700000000000001,16.8,18.900000000000002,21.0,23.1,25.200000000000003,27.3,29.400000000000002,31.5,33.6,35.7,37.800000000000004,39.9,42.0,44.1,46.2,48.300000000000004,50.400000000000006,52.5,54.6,56.7,58.800000000000004,60.900000000000006,63.0,65.10000000000001,67.2,69.3,71.4,73.5,75.60000000000001,77.7,79.8,81.9,84.0]},"near_unique":false,"sample":["Crow Hill Cairn Circle","Arkaun","Su Nuraxi","","Sornaichean Coir' Fhinn","Shaori fortress-1","Anta do Monte da Caeira 2","Tomba dei Giganti","","Menhir von Benzingerode","Table du Jars","F\u00e5r\u00f6 14:1","Nuraghe Marchiesu","Menhir dit la Pierre Fiche de Chac\u00e9","Bruncu Forru","","","Nuraghe San Priamo I","Nuraghe Aurras [Tramatza]","Kapanasta","Dolmen de la Pierre Blanche","Schlingsteine","","Menhir du Coulet B","Menhir de Lestenach","Dolmen de M\u00e9arzenne","\u041c\u0435\u0433\u0430\u043b\u0438\u0442\u044b","","","Nuraghe Montarveddu","Gro\u00dfsteingrab Grebbin","Gro\u00dfsteingrab Tessin","Gro\u00dfsteingrab Gnewitz 6","Menhir Iguzkiko Lepoa","Dolmen Gorafe 89","Antas das Figueirinhas","Achavanich Stone Circle","","Mamoa de Outeiro de Gregos 2","Langbett Gro\u00dfenbrode","","","Dolmen1-G\u00e9antes","","Nuraghe Cae","Dolmen de Port Blanc","Errebelu","Saroiko Bisker","","Nuraghe Cabudbbene II"],"top_values":[["",4720],["\u0414\u043e\u043b\u044c\u043c\u0435\u043d",191],["Dermot & Grania's Bed",62],["Dolmen",51],["Menhir",50],["Standing Stone",48],["\u0414\u043e\u043b\u044c\u043c\u0435\u043d 
(\u0440\u0430\u0437\u0440\u0443\u0448\u0435\u043d)",34],["Giant's Grave",31],["A Hurler",30],["Stone Circle",23],["Tomasu",10],["All\u00e9e couverte",9],["Dolmen de la Pierre Lev\u00e9e",9],["Druid's Altar",8],["Okabe harrespila / Cromlech d'Okabe",8],["Nuraghe",7],["Langer Stein",6],["\u0414\u043e\u043b\u044c\u043c\u0435\u043d\u044b",5],["Cairn",5],["Tomba dei Giganti",5]],"top_words":[["de",2765],["dolmen",2088],["menhir",1162],["nuraghe",950],["la",881],["gro\u00dfsteingrab",864],["du",537],["1",498],["stone",476],["2",445],["anta",404],["pierre",362],["da",355],["do",281],["\u0434\u043e\u043b\u044c\u043c\u0435\u043d",263],["des",258],["circle",241],["3",223],["dit",220],["del",183],["couverte",164],["all\u00e9e",148],["standing",137],["4",119],["di",111]],"vocab_skipped":null,"word_histogram":{"counts":[5849,0,2429,0,0,3652,0,1854,0,0,973,0,477,0,0,142,0,47,0,0,20,0,15,0,0,3,0,1,0,2],"edges":[1.0,1.4,1.8,2.2,2.6,3.0,3.4000000000000004,3.8000000000000003,4.2,4.6,5.0,5.4,5.800000000000001,6.2,6.6000000000000005,7.0,7.4,7.800000000000001,8.2,8.600000000000001,9.0,9.4,9.8,10.200000000000001,10.600000000000001,11.0,11.4,11.8,12.200000000000001,12.600000000000001,13.0]}},"kind":"text","n":15464,"n_null":0,"n_unique":9869,"null_rate":0.0,"stats":{"allcaps_rate":0.0031686497672012417,"boilerplate_rate":0.0,"duplicate_rate":0.3618080703569581,"emoji_rate":0.0,"len_max":84,"len_mean":13.64685721676151,"len_median":15.0,"len_min":0,"len_p95":30.0,"n_duplicates":5595,"n_empty":4720,"one_word_rate":0.37823331608898086,"readability_flesch_mean":46.90115357142859,"url_rate":0.0,"vocab_size":9447,"word_mean":2.494632695292292,"word_median":2.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-3.09"}],"column":"lat","extras":{"histogram":{"counts":[1,0,0,0,1,0,3,0,2,0,1,1,4,4,8,21,3,13,26,1,7,5,8,2,5,2,8,3,9,38,523,2211,3646,3269,1808,1660,1627,506,33,5],"edges":[-51.8088639,-48.884412075,-45.95996025,-43.035508425,-40.1110566,-37.186604775,-34.26215295,-31.337701
125,-28.4132493,-25.488797475000002,-22.56434565,-19.639893825,-16.715442000000003,-13.790990175000005,-10.866538349999999,-7.942086525000001,-5.017634700000002,-2.0931828750000037,0.8312689499999948,3.7557207750000003,6.680172599999999,9.604624424999997,12.529076249999996,15.453528075000001,18.377979899999993,21.302431724999998,24.22688354999999,27.151335374999995,30.0757872,33.00023902499999,35.92469085,38.84914267499999,41.773594499999994,44.698046325,47.62249814999999,50.546949975,53.47140179999999,56.395853624999994,59.32030545,62.24475727499999,65.1692091]},"sample":[53.1624837,54.078374,47.7918477,47.9365383,54.23749,55.0474107,54.8307668,42.3297649,53.661108,48.0919805,51.7461184,42.6000685,52.2717459,52.3572996,47.4363212,47.7143845,53.6337909,48.6729202,43.9574108,44.1249094,44.0175375,44.0156302,54.2190289,44.4845157,44.48835,44.6156285,41.9038398,55.7973692,53.4880139,47.245948,39.7368417,46.4435433,47.7943388,52.7538668,48.1057078,56.3609234,50.516869,50.5170201,48.9522457,40.011016,40.0473349,44.4799351,48.4627191,43.29979,45.9906557,52.2721842,51.5409947,53.0450808,47.197972,43.2279766,51.8181416,43.1878919,44.2350787,44.2351917,44.2354922,44.2356741,52.872824,45.1239628,46.0501979,47.5918884,47.59193,47.592111,47.5922036,47.5922641,47.5922792,47.5923919,47.5920893,47.5921975,47.5922211,47.5922397,47.5922687,47.592267,47.5923371,47.5924272,47.5924876,47.5926599,47.5926794,47.5926942,47.5927337,47.5928657,47.5930303,47.5931514,47.5932122,47.5929702,47.5929804,47.5932913,47.5933071,47.5933233,47.5934603,47.5935643,47.5937194,47.5938563,47.593913,47.5940386,47.5940943,47.5941118,47.5949009,47.5950916,47.5929381,47.5959059,47.5962573,47.5962905,47.596551,47.5965676,47.5966052,47.5966934,47.5967905,47.5976073,47.5979473,47.5980282,47.5980292,47.5980677,47.5981533,47.5987723,47.5988358,47.5991425,47.5992323,47.599413,47.5994761,47.5999363,47.6004728,47.6011378,47.6042002,47.6042735,47.6043761,47.6044421,47.6044614,47.6048947,50.1645189,46.6288258,56.1228207
,43.7613932,40.0569576,40.0350274,40.224467,43.3635218,22.7922111,43.5292653,43.5235266,46.4844642,48.7923465,42.7258018,39.7200095,39.7170142,43.1445452,54.840462,44.3264893,58.1676025,44.4086022,44.0450534,43.2652561,54.1017064,41.6687997,48.7860491,48.6398949,53.8620536,40.8286826,47.8186671,48.1358245,48.1176927,53.3678445,53.1309978,44.5628122,45.7821391,49.8619228,42.9292357,42.992941,42.9400201,43.2948758,38.5134165,43.0002439,42.9057464,42.9719074,42.9889182,37.4684709,42.6643832,42.9446501,43.3050639,43.2981321,43.2310116,43.2680259,37.4511047,37.4472613,43.1090669,43.0921382,43.1083013,43.1020917,43.0808132,43.2122673,52.4821628,42.8559511,43.825203,44.4080188,41.2034302,42.0094796,39.8955168,58.3868494,44.4287879,52.8021774,49.7216231,39.8379774,47.3099536,40.0957253,41.1802682,43.5251015,39.8480489,39.4001554,39.44495,38.7038104,38.705243,38.60339,38.6976381,38.64505,38.86881,38.87573,40.6914237,40.695025,41.0357701,40.442472,40.8161,41.02264,37.5762009,38.6838328,39.411264,40.9420678,40.8347632,42.0711626,52.7768429,47.5919191,47.5916631,47.492329,47.7647699,47.76486,47.6638475,47.6345422,47.634516,47.6342828,47.6342575,47.6344871,43.9056161,43.9686136,43.9216156,43.1348155,46.876244,57.6014514,58.2849335,58.9600478,58.9273871,59.3005472,55.9539097,44.5636227,50.5197664,54.2519854,54.8001885,44.3903533,44.7393619,47.0832102,1.8803328,40.0110739,44.3708992,43.2327096,47.8586402,44.7483946,43.1675671,44.1937934,57.0451308,49.2818335,48.6619978,43.7971176,44.5794581,47.3393934,43.0468851,44.541022,44.5297417,44.5007888,54.2960037,47.2689642,25.7154659,43.6881422,44.5493995,48.3897349,48.3856524,48.3994609,51.5869855,54.3913958,46.9460146,48.2736849,48.2734367,48.2732582,40.1308973,40.3877878,42.7550472,36.9229588,45.7889311,43.1011385,48.5859338,44.4995492,40.9043989,53.5239895,45.0829966,42.5462646,39.2385482,38.83851,36.9960649,43.792482,41.389035,41.4906679,42.62861,42.29667,42.38694,41.81167,42.8480346,41.6239822,46.4696469,44.8512509,47.8300018,53.286
0814,53.3875625,53.3626624,52.7403322,53.5322324,54.0577529,53.8972933,54.0094849,53.8915273,53.8309302,53.6725296,53.7773767,49.1697283,48.1496718,48.0696125,48.5332466,48.5764524,45.236883,47.6171086,47.70909,46.1577838,47.2486592,44.1830445,47.6934108,43.5929505,48.2224528,47.2381653,47.839867,47.8143231,43.0772063,45.1724833,48.5363284,44.0392129,47.6285393,44.2491987,44.3813035,45.3134608,44.1151814,53.1678295,44.3328603,41.7384116,44.4241731,50.0598428,54.4976677,54.492364,54.4357964,54.2599692,54.0583393,47.5168291,50.0957357,52.7928181,44.4840954,47.3900695,44.5123808,52.4636564,52.483775,54.4210827,40.147022,51.1426262,42.0118143,42.8872049,54.2912145,43.825369,43.7962678,43.9014563,43.4060564,51.459364,53.2152866,53.6650972,52.729218,38.6884174,38.9059114,39.7982857,39.8199663,39.8869414,39.8868839,52.5118414,39.8591723,57.3567013,54.0465915,56.8760532,37.5598728,53.7513534,14.7483512,53.6942771,44.2260825,57.4937729,42.4262054,55.9239528,40.9229176,44.3872535,54.0407103,38.1074162,41.0931404,51.8131424,51.868482,52.3685578,49.8250213,44.0483165,53.3958077,40.3487105,44.3651377,56.5622389,38.959305,38.962602,53.2252369,48.302683,39.3796516,39.2880552,39.2985204,39.1843989,40.6371092,47.5960302,39.130929,43.6780713,55.5378347,52.1726922,52.5579223,40.5949293,52.6505829,46.6839013,50.670596,39.3949145,51.4208393,40.2264375,40.2247148,53.3452357,38.557489,39.8541235,40.1287709,39.7055709,39.7056807,40.2582198,39.8515647,40.5914439,40.5541249,54.2344197,50.1585599,47.7652096,55.5818197,40.5306607,40.0350603,39.8227527,40.5774416,56.2707673,53.2039363,54.0554216,40.6505739,56.4909412,37.9802781,55.712015,51.4276153,51.4292198,53.9288462,40.4164163,54.2353186,40.6233524,50.5905098,55.3912598,52.2072776,39.7062048,39.7058815,39.7058234,39.7061606,40.4007705,48.8788207,57.2915961,51.4127268,39.4428792,39.3218887,54.6895135,54.2361633,39.8571677,52.5084491,47.8972555,39.4790776,54.1788173,51.9882981,51.8812262,51.8180605,54.0283103,40.3130534,40.1991671,38.9813381]
},"kind":"numeric","n":15464,"n_null":0,"n_unique":15320,"null_rate":0.0,"stats":{"iqr":7.569137749999996,"kurtosis":26.331405038521762,"max":65.1692091,"mean":46.414525102121054,"median":47.59247835,"min":-51.8088639,"n_outliers":134,"outlier_rate":0.0086652871184687,"q1":42.94914862500001,"q3":50.518286375,"skew":-3.087121456695528,"std":6.810069979161207,"zero_rate":0.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+3.65"}],"column":"lon","extras":{"histogram":{"counts":[1,0,0,1,0,1,1,2,2,6,34,2,1,5,1,0,0,0,4,3136,7654,3031,921,58,15,441,21,3,0,1,7,7,7,1,19,7,23,30,15,6],"edges":[-151.3584628,-143.9560541825,-136.553645565,-129.15123694750002,-121.74882833000001,-114.34641971250001,-106.94401109500001,-99.5416024775,-92.13919386,-84.7367852425,-77.334376625,-69.9319680075,-62.52955939,-55.1271507725,-47.724742155,-40.3223335375,-32.91992492,-25.5175163025,-18.115107684999998,-10.712699067499983,-3.3102904499999966,4.09211816749999,11.494526785000005,18.89693540250002,26.299344020000007,33.70175263749999,41.10416125500001,48.50656987250002,55.90897849000001,63.311387107499996,70.71379572500001,78.11620434250003,85.51861296000001,92.9210215775,100.32343019500001,107.72583881250003,115.12824743000002,122.5306560475,129.93306466500005,137.33547328250003,144.7378819]},"sample":[-1.6449916,11.9526491,-4.2653301,-1.4048786,10.60158,10.1285896,-2.7100364,3.1338031,8.7711282,-4.3795644,-2.0937861,-9.0167702,11.3430554,8.1490604,-2.1365533,-3.4690737,9.3723627,-3.5018541,2.9948298,39.1272725,39.3745047,39.3799335,-7.3407867,38.4411317,38.4065164,1.786805,3.1223533,12.3408143,9.5430733,-2.2933114,8.9655307,-1.4660855,-3.4439674,10.8505159,-4.3823988,-5.8606231,-4.4582193,-4.4577979,2.2827163,9.0305444,8.6789082,38.4057139,-5.0375472,-1.8320847,-1.0002541,11.3459436,11.905453,8.4508471,-2.1535008,-1.9589511,11.9284998,-1.9555801,40.5353509,40.5342876,40.5351316,40.5352843,7.5246885,3.0497272,1.1116382,-3.0845366,-3.083258,-3.0829868,-3.0831333,-3.0828766,-3
.0823455,-3.0823232,-3.0841292,-3.0836831,-3.085182,-3.0844012,-3.0834064,-3.0846654,-3.0835857,-3.084386,-3.0823461,-3.083072,-3.0829535,-3.0828849,-3.0833872,-3.0820001,-3.0822119,-3.0817163,-3.0808151,-3.0803509,-3.0803145,-3.0797217,-3.0789293,-3.0785805,-3.0792369,-3.0796986,-3.0779434,-3.0782366,-3.0774194,-3.0773438,-3.0773952,-3.0778306,-3.0741955,-3.0742309,-3.0797748,-3.0664154,-3.0669984,-3.0672554,-3.0658542,-3.0663577,-3.0659888,-3.0652047,-3.0642183,-3.0630498,-3.0632836,-3.0621907,-3.0630964,-3.0621069,-3.0627879,-3.0603746,-3.0602605,-3.0598569,-3.059496,-3.0589952,-3.0589574,-3.0583214,-3.057346,-3.0556775,-3.0494567,-3.0502306,-3.0472264,-3.0487021,-3.0488601,-3.0498194,4.0841198,10.8879311,-5.4960296,3.5090769,8.731781,8.5363565,-5.9494073,2.7608146,121.1211473,3.5496306,3.5721808,1.7190311,-3.5701119,-1.2241719,9.0219595,8.9880424,-8.94424,9.5684403,4.3956,13.5769176,3.6242355,3.0518314,-1.7592596,9.1893704,44.1547821,-3.3271763,-3.2043954,11.2816054,8.8861572,-4.3230076,-3.7664193,-3.8100772,9.774327,-4.2063555,4.4404759,3.1469475,7.1779803,-2.2500094,-2.0941256,-2.1592968,-2.0811131,-6.8986423,-1.5859287,-1.2527697,-1.3449892,-1.7542972,-3.0480587,-1.1307173,-0.8375615,-1.6591056,-1.6721203,-1.7658449,-1.7408319,-3.0207468,-3.0212948,-1.775805,-1.8280906,-1.7823456,-1.4930797,-1.5641476,-1.5014733,7.8850594,-1.4287255,3.7928637,1.9057331,-8.0075339,1.0023842,4.1881574,-3.3975872,4.2939123,7.8723587,6.8408454,18.2473417,-2.4302082,8.8518678,16.5095783,-5.7890929,18.3610313,-7.4907269,-7.4719,-8.080646,-8.079478,-8.07804,-8.2373474,-8.16624,-7.9773,-7.95011,-8.3039585,-7.988574,-7.4375187,-7.9436291,-7.7308,-7.4211,-8.2606535,-7.66473,-7.499067,-7.6805566,-7.7554599,-8.0959293,7.5572703,-3.0860257,-3.0862146,-2.8343079,-1.9739692,-1.974334,8.4016933,-3.1489731,-3.1487263,-3.1487263,-3.1487021,-3.1478009,39.4129571,39.3887708,39.4318729,-1.4745342,4.5342522,12.1097977,11.5429297,11.3176094,11.3171567,18.4120972,-2.6782896,38.2314392,-4.4719649,-8.
5163338,12.0864741,4.0281819,0.7533383,-0.02686,-76.3032222,9.0305428,3.0026921,-1.4643299,0.0929421,38.0447909,-1.8032294,40.5456304,-2.3399736,-0.4426758,3.7254676,3.4139979,38.0942546,-0.2563226,-2.762461,1.8777405,1.8554353,1.8653236,-3.0227101,0.7941803,91.9203302,3.4166253,2.124677,-3.0468231,-3.0526918,-2.7945855,-9.6952928,-1.0369895,-0.138294,-4.6094875,-4.6100695,-4.6098657,18.2836583,9.284674,10.1903603,15.1581203,8.02733,40.8488415,-0.2438515,1.9915429,-7.8200748,12.9345115,1.6224415,2.343395,9.4889488,-8.11853,-3.8977488,3.3904275,-7.514996,-7.7205504,2.3275,0.96111,2.8925,2.15028,-8.0239659,2.4929121,-1.5018158,1.7598155,-3.0263889,8.6512318,14.2229987,13.803758,11.2446285,11.8027409,12.4997824,11.9512074,13.2040325,13.6099821,13.1174111,11.6019046,13.3194521,1.328207,1.4103842,1.5021796,-4.7478379,-4.6295248,2.9409612,-3.1285508,-3.2457689,2.0579406,-2.0869324,3.3770314,-3.254058,2.6634635,-4.541682,-2.0798347,-3.6001436,-3.6288229,2.643061,3.8072187,-1.5265,3.7821602,-3.1646051,3.0423647,4.1547129,1.4982542,4.2719168,-1.6293347,4.2445986,8.827572,2.9396863,-5.5947549,9.8842898,9.8664735,10.0690833,9.8986934,10.3283789,-3.1288902,-5.5783517,-4.0348128,38.401975,-2.9681835,1.9153178,-8.1685844,-8.1495434,-0.5827219,8.6062539,11.8438175,8.6880215,-0.7266542,-3.0300366,2.7033,2.8059035,2.8505218,5.231303,11.2458317,-6.154889,-8.4048045,-3.9303267,-7.6792599,-7.3662443,9.6181488,9.6153841,9.6529301,9.653056,-8.5200611,9.2329375,-2.4245234,-8.1261733,13.9802635,-6.7175957,12.0111332,39.4254962,-6.4752582,3.7846801,-2.1992625,25.4393983,-3.6158905,-8.388948,2.527918,12.6213499,-8.7260574,-5.9980192,-8.9880742,-8.9233834,-7.3899466,5.7284182,10.284171,-4.460711,8.6913533,1.7662199,-3.5109201,-7.437693,-7.446428,-4.4046626,-0.7549126,9.5343289,9.5765851,9.5998138,9.5726524,8.6666361,-3.0641648,-7.617071,6.8018393,-3.0273429,-10.0728267,-9.6218401,8.2428866,11.0228082,0.405384,-3.9053641,8.813614,-1.8462306,8.6028519,8.7341379,9.9406339,-8.0611743,8.9586227,8.
8583604,8.991326,8.9914618,9.4861199,9.4015266,8.6068013,8.6134807,-3.1510555,-5.6044972,-1.9896499,9.1450441,9.3239912,9.616572,9.4778758,9.1464348,10.509473,-4.2174813,-8.3778948,9.4068765,10.512876,38.7400264,-5.6137021,-1.8555986,-1.8562774,17.6915147,8.6296682,-3.1510001,8.5011647,-4.5606646,11.3039486,7.792162,8.9907962,8.9909235,8.9910078,8.9905425,17.6839684,-1.8211983,-2.399962,-1.8282741,9.1140834,9.2332452,-8.7747197,-9.2573179,9.6600343,-8.5319727,-4.2203485,9.0003266,-7.1051667,-8.8877832,-8.7908915,-8.913717,-9.1340657,9.3999203,9.3433742,8.4099874]},"kind":"numeric","n":15464,"n_null":0,"n_unique":15407,"null_rate":0.0,"stats":{"iqr":11.5306975,"kurtosis":34.34086849318756,"max":144.7378819,"mean":2.61819560683523,"median":-1.6201083,"min":-151.3584628,"n_outliers":676,"outlier_rate":0.043714433523021214,"q1":-3.08339485,"q3":8.447302650000001,"skew":3.6537140695024246,"std":14.643722734537622,"zero_rate":0.0}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.7% of 
rows"}],"column":"type","extras":{"singletons":7,"top_values":[["megalith",15113],["menhir",156],["dolmen",83],["standing_stone",59],["stone_circle",16],["nuraghe",8],["gallery_grave",6],["passage_grave",5],["lech",4],["stone_ship",3],["tholos",2],["chamber",2],["village",1],["plaque",1],["cist",1],["long_barrow",1],["chambered_cairn",1],["grave_field",1],["stone",1]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":19,"null_rate":0.0,"stats":{"cardinality":19,"entropy":0.20956605478377352,"entropy_ratio":0.049333717235181505,"top_rate":0.9773021210553544,"top_value":"megalith"}},{"alerts":[],"column":"megalith_type","extras":{"singletons":29,"top_values":[["menhir",5231],["dolmen",4501],["",1714],["nuraghe",1080],["stone_circle",1011],["passage_grave",537],["chamber",437],["long_barrow",184],["alignment",116],["cist",107],["gallery_grave",85],["standing_stone",68],["stone_ship",47],["tholos",32],["court_tomb",32],["round_barrow",25],["well",23],["wedge_tomb",23],["cairn",20],["stone",20]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":73,"null_rate":0.0,"stats":{"cardinality":73,"entropy":2.749116203786542,"entropy_ratio":0.44413475335785046,"top_rate":0.33826952922917747,"top_value":"menhir"}},{"alerts":[{"code":"long_tail","level":"info","message":"558 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 95.8% of rows"}],"column":"description","extras":{"singletons":558,"top_values":[["",14814],["J\u00e6ttestue",11],["Anta da Herdade da Ordem",8],["Stone circle",5],["Gro\u00dfsteingrab",5],["Rest eines Gro\u00dfsteingrabes",5],["Long Barrow",4],["Dolmen",4],["Langdysse",4],["Four standing and one recumbent standing stone.",4],["pair of two standing stones",4],["H\u00fcnengrab",3],["Henge / C\u00edrculo l\u00edtico",3],["Menhir",2],["\u0413\u0430\u0440\u043c\u043e\u043d\u0438\u044f",2],["Runddysse",2],["All\u00e9e couverte",2],["Stendysse",2],["Tumulus, dalle de couverture",2],["Table, chevet, orthostates droit et 
gauche",2]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":587,"null_rate":0.0,"stats":{"cardinality":587,"entropy":0.6327713258244647,"entropy_ratio":0.06880030632511847,"top_rate":0.9579668908432488,"top_value":""}},{"alerts":[{"code":"one_word","level":"warn","message":"85.2% rows are a single word"},{"code":"duplicates","level":"warn","message":"86.7% duplicate strings"}],"column":"wikipedia","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[13060,0,0,1,3,21,47,28,159,115,191,236,271,254,203,130,198,133,110,75,49,97,30,6,12,7,4,2,8,3,3,0,0,3,0,1,1,0,1,2],"edges":[0.0,1.875,3.75,5.625,7.5,9.375,11.25,13.125,15.0,16.875,18.75,20.625,22.5,24.375,26.25,28.125,30.0,31.875,33.75,35.625,37.5,39.375,41.25,43.125,45.0,46.875,48.75,50.625,52.5,54.375,56.25,58.125,60.0,61.875,63.75,65.625,67.5,69.375,71.25,73.125,75.0]},"near_unique":false,"sample":["","","it:Su Nuraxi","","","ka:\u10e8\u10d0\u10dd\u10e0\u10d8\u10e1 \u10ea\u10d8\u10ee\u10d4","","","","de:Menhir von Benzingerode","","","","","","","","","","","fr:Dolmen de la Pierre Blanche","de:Schlingsteine","","","","","","","","","de:Gro\u00dfsteingr\u00e4ber bei Grebbin","de:Gro\u00dfsteingrab Tessin","de:Gro\u00dfsteingr\u00e4ber von Gnewitz","","","","en:Achavanich","","","de:Langbett Krausort","","","","","","","","","",""],"top_values":[["",13060],["de:Gro\u00dfsteingr\u00e4ber im Haldensleber Forst",70],["pt:Necr\u00f3pole Megal\u00edtica do Bustelo",17],["de:Liste der Navetas",14],["en:Drizzlecombe",9],["de:Gro\u00dfsteingr\u00e4ber bei Leetze",8],["de:Megalithanlagen bei Westerwanna",7],["de:Gro\u00dfsteingr\u00e4ber bei Tangeln",7],["de:Gro\u00dfdolmen von Sassen",7],["de:Dolmen von Putlos",7],["de:Gro\u00dfsteingr\u00e4ber bei Lindh\u00f6ft",6],["de:Gro\u00dfsteingr\u00e4ber bei L\u00fcdelsen",6],["de:Gro\u00dfsteingr\u00e4ber von Gnewitz",6],["de:Gro\u00dfsteingr\u00e4ber bei Nehmten",5],["de:Sieben Steinh\u00e4user",5],["de:Gro\u00dfsteingr\u00e4ber bei 
Strehlow",5],["en:Timoney Stones",5],["en:Carrowmore",5],["de:Gro\u00dfsteingr\u00e4ber bei Behrensbrook",4],["de:H\u00fcnenbetten von Daudieck",4]],"top_words":[["de",680],["de:gro\u00dfsteingr\u00e4ber",345],["bei",268],["fr:dolmen",213],["la",196],["von",173],["de:gro\u00dfsteingrab",169],["fr:menhir",156],["ca:dolmen",118],["du",114],["fr:pierre",97],["im",92],["forst",79],["del",71],["haldensleber",70],["des",69],["couverte",67],["stone",61],["fr:all\u00e9e",56],["(hunebed)",55],["pierre",43],["circle",41],["di",39],["fr:dolmens",38],["de:dolmen",34]],"vocab_skipped":null,"word_histogram":{"counts":[13182,0,0,443,0,0,1040,0,0,494,0,0,178,0,0,86,0,0,25,0,0,8,0,0,3,0,0,3,0,2],"edges":[1.0,1.3333333333333333,1.6666666666666665,2.0,2.333333333333333,2.6666666666666665,3.0,3.333333333333333,3.6666666666666665,4.0,4.333333333333333,4.666666666666666,5.0,5.333333333333333,5.666666666666666,6.0,6.333333333333333,6.666666666666666,7.0,7.333333333333333,7.666666666666666,8.0,8.333333333333332,8.666666666666666,9.0,9.333333333333332,9.666666666666666,10.0,10.333333333333332,10.666666666666666,11.0]}},"kind":"text","n":15464,"n_null":0,"n_unique":2058,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.8669167097775479,"emoji_rate":0.0,"len_max":75,"len_mean":4.100038799793068,"len_median":0.0,"len_min":0,"len_p95":29.0,"n_duplicates":13406,"n_empty":13060,"one_word_rate":0.8524314536989136,"readability_flesch_mean":5.479500000000004,"url_rate":0.0,"vocab_size":2769,"word_mean":1.3507501293326436,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"allcaps","level":"info","message":"30.0% rows are all-caps"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"72.3% duplicate 
strings"}],"column":"wikidata","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[10819,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,0,0,0,94,0,0,0,1167,0,0,0,2574,0,0,805],"edges":[0.0,0.25,0.5,0.75,1.0,1.25,1.5,1.75,2.0,2.25,2.5,2.75,3.0,3.25,3.5,3.75,4.0,4.25,4.5,4.75,5.0,5.25,5.5,5.75,6.0,6.25,6.5,6.75,7.0,7.25,7.5,7.75,8.0,8.25,8.5,8.75,9.0,9.25,9.5,9.75,10.0]},"near_unique":false,"sample":["","","Q253241","Q125484975","","Q16377805","Q19834685","","","Q17325138","","","Q122211196","","Q122178910","","","","Q122178766","","Q3034091","Q1665508","","","","","","","","Q122211085","Q28913713","Q27479027","Q120638108","","","","Q1529774","","","Q1804880","","Q30130655","Q22966736","","Q47491990","","Q66114150","","","Q122178868"],"top_values":[["",10819],["Q106546933",17],["Q1917052",13],["Q28051811",13],["Q97602812",13],["Q1917047",11],["Q950572",9],["Q19834685",9],["Q1404118",8],["Q1549706",8],["Q1549712",7],["Q1548109",7],["Q15526221",7],["Q65952676",6],["Q1549707",6],["Q1490556",5],["Q65237379",5],["Q65318652",5],["Q240198",5],["Q3034142",5]],"top_words":[["q106546933",17],["q1917052",13],["q28051811",13],["q97602812",13],["q1917047",11],["q950572",9],["q19834685",9],["q1404118",8],["q1549706",8],["q1549712",7],["q1548109",7],["q15526221",7],["q65952676",6],["q1549707",6],["q1490556",5],["q65237379",5],["q65318652",5],["q240198",5],["q3034142",5],["q29912887",5],["q832458",4],["q65237336",4],["q65095924",4],["q1652332",4],["q1549689",4]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15464,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.366666666
6666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":15464,"n_null":0,"n_unique":4289,"null_rate":0.0,"stats":{"allcaps_rate":0.3003750646663218,"boilerplate_rate":0.0,"duplicate_rate":0.722646145887222,"emoji_rate":0.0,"len_max":10,"len_mean":2.6668391101914124,"len_median":0.0,"len_min":0,"len_p95":10.0,"n_duplicates":11175,"n_empty":10819,"one_word_rate":1.0,"readability_flesch_mean":38.790400000000005,"url_rate":0.0,"vocab_size":4288,"word_mean":1.0,"word_median":1.0}},{"alerts":[],"column":"heritage","extras":{"singletons":3,"top_values":[["",13602],["2",1264],["3",205],["1",120],["yes",109],["no",69],["Em Vias de Classifica\u00e7\u00e3o",60],["4",24],["7",8],["Scheduled Monument",1],["6",1],["M0021",1]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":12,"null_rate":0.0,"stats":{"cardinality":12,"entropy":0.7343277435721365,"entropy_ratio":0.2048355438653593,"top_rate":0.8795913088463528,"top_value":""}},{"alerts":[],"column":"heritage_operator","extras":{"singletons":8,"top_values":[["",13848],["mhs",960],["IE:smr",229],["dgpc",185],["pc",103],["rce",23],["Historic Environment Scotland",18],["cadw",14],["whc",14],["lda",12],["nld",9],["IE:smr;IE:nm",8],["he",6],["Cadw",5],["mecd",4],["DGPC",3],["IE:smr:IE:nm",3],["alsh",2],["hs",2],["raa",2]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":31,"null_rate":0.0,"stats":{"cardinality":31,"entropy":0.7028371746814511,"entropy_ratio":0.14186704172539466,"top_rate":0.8954992240041386,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"21 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 99.8% of rows"}],"column":"start_date","extras":{"singletons":21,"top_values":[["",15430],["1999",5],["C-30",4],["~2000 BC",2],["between 3500 and 2800 BCE",2],["2900 BC..2600 BC",1],["-3000 BC",1],["-2000",1],["2004-07-01",1],["before -3250",1],["3720 BC",1],["2800-2200 BC",1],["~5000 BCE",1],["~C30 BC",1],["2000 BC",1],["Mittelneolithikum (2350 - 
2150 v. u. Z.)",1],["1500 BC",1],["2800 BC..2200 BC",1],["2012-04-30",1],["3100 BC",1]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":26,"null_rate":0.0,"stats":{"cardinality":26,"entropy":0.03223960869772837,"entropy_ratio":0.0068588495185463935,"top_rate":0.997801345059493,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 98.4% of rows"}],"column":"material","extras":{"singletons":7,"top_values":[["",15223],["stone",196],["granite",29],["sandstone",5],["limestone",2],["dry_stone",2],["Quarzit",1],["reinforced_concrete",1],["stone;concrete",1],["basalt",1],["quartz_blanc",1],["granit",1],["andesite",1]]},"kind":"categorical","n":15464,"n_null":0,"n_unique":13,"null_rate":0.0,"stats":{"cardinality":13,"entropy":0.132559405724456,"entropy_ratio":0.035822609154959266,"top_rate":0.9844154164511123,"top_value":""}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","megalith_type.top_values","megalith_type.stats.top_rate","description.stats.top_rate","material.stats.top_rate","wikidata.stats.n_empty","lat.stats.median","lat.stats.skew","lon.stats.median","lon.stats.skew","lon.stats.outlier_rate","heritage.top_values","type.top_values"],"featured_charts":[{"caption":"Look for how dominated the dataset is by menhirs and dolmens, and which rarer types (nuraghes, stone circles, passage graves) still have enough records to analyse separately.","column":"megalith_type","kind":"bar"},{"caption":"The strong negative skew reveals that most megaliths cluster in a narrow Northern European band, with a sparse tail of southern and non-European outliers worth investigating.","column":"lat","kind":"histogram"},{"caption":"High positive skew and a 4.4% outlier rate in longitude flag sites far outside Western Europe \u2014 check whether these are data errors or genuinely remote 
monuments.","column":"lon","kind":"histogram"},{"caption":"Only about 12% of sites carry any heritage designation; look at which designation levels (1, 2, 3) are most common among those that do.","column":"heritage","kind":"bar"},{"caption":"Among the minority of sites with a heritage operator, 'mhs' (France) and 'IE:smr' (Ireland) dominate \u2014 revealing which countries have contributed the most structured heritage data.","column":"heritage_operator","kind":"bar"}],"model":"anthropic:default","narrative":"This dataset catalogues 15,464 megalithic structures (dolmens, menhirs, stone circles, nuraghes, and more) drawn from OpenStreetMap, with geographic coordinates, heritage classification, and typology fields. The most striking pattern is extreme sparsity in descriptive metadata: over 95% of records have no description, 98.4% have no material recorded, and roughly 70% lack a Wikidata link, suggesting the dataset is geographically rich but editorially thin. The megalith_type column is the most informative categorical field, splitting meaningfully across menhirs (5,231), dolmens (4,501), nuraghes (1,080), and stone circles (1,011). Geographically, the bulk of sites cluster in Western Europe (median latitude ~47.6\u00b0N, median longitude ~-1.6\u00b0), but high skew and outliers in both lat and lon indicate a long tail of sites in places like Sardinia, Iberia, Ireland, and beyond \u2014 worth mapping.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["column","n","n_unique","null_rate","stats.n_empty","stats.duplicate_rate","stats.n_duplicates","stats.allcaps_rate","top_values"],"model":"anthropic:default","narrative":"This column stores Wikidata entity identifiers (Q-codes) linking dataset rows to Wikidata knowledge-base entries. 
Two signals demand immediate attention: 10,819 of 15,464 rows (70%) are empty strings rather than true nulls, and the duplicate_rate of 0.723 is almost entirely an artefact of those blanks \u2014 10,818 of the 11,175 duplicates are repeated empty strings, while only 357 of the 4,645 populated rows repeat a Q-code. The top value 'Q106546933' appears 17 times, suggesting an occasional many-to-one entity mapping. The allcaps_rate of 0.300 matches the populated share of rows, reflecting the uppercase 'Q' prefix on valid codes.","role":"foreign_key","scope":"column","target":"wikidata","treatment":"Replace empty strings with null, then left-join on this Q-code to enrich with Wikidata properties; expect a mostly one-to-one join with occasional many-to-one matches, since only 357 populated rows repeat a Q-code."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.n_empty","stats.duplicate_rate","stats.n_duplicates","stats.one_word_rate","stats.word_mean","top_values","top_words"],"model":"anthropic:default","narrative":"This column contains the local or common name of prehistoric megalithic monuments (dolmens, menhirs, stone circles, nuraghes, etc.), drawing from a multilingual dataset spanning at least English, French, Russian (Cyrillic), and German. Two signals stand out: 30.5% of rows (4,720 of 15,464) are empty strings rather than true nulls, and the duplicate rate is 36.2% (5,595 duplicates) \u2014 4,719 of those duplicates are repeated empty strings, while the remaining 876 come from names reused across distinct monuments, notably generic type-names like '\u0414\u043e\u043b\u043c\u0435\u043d' (191), 'Dolmen' (51), 'Menhir' (50), and 'Standing Stone' (48). 
The one-word rate of 37.8% and word mean of ~2.5 are consistent with short monument names, but the 4,720 empty strings should be treated as missing values.","role":"label","scope":"column","target":"name","treatment":"Replace empty strings with NaN, then use as a descriptive label or weak text feature; do not treat as a unique identifier due to 36% duplicate rate and multilingual generic names."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","n_empty","duplicate_rate","n_duplicates","top_values","top_words","one_word_rate","len_max","len_mean"],"model":"anthropic:default","narrative":"This column stores Wikipedia article references in a 'language-code:article-title' format (e.g., 'de:Gro\u00dfsteingr\u00e4ber im Haldensleber Forst'), linking dataset records to corresponding Wikipedia pages across multiple languages including German, French, Catalan, Portuguese, and English. The dominant surprise is that 13,060 of 15,464 rows (84.5%) are empty strings, meaning most records have no Wikipedia link at all. Of the 13,406 duplicates, 13,059 are simply repeated empty strings; only 347 occur among the 2,404 populated values, where the same Wikipedia article is referenced by multiple records \u2014 consistent with grouped/list articles covering many individual megalithic sites. 
The multi-language mix (de, fr, pt, ca, en prefixes visible) is expected for a multilingual cultural-heritage dataset.","role":"metadata","scope":"column","target":"wikipedia","treatment":"Parse language prefix and article slug into separate fields; treat empty strings as nulls; use as an optional enrichment join key rather than a model feature."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","n","n_unique","entropy_ratio","top_values","alerts"],"model":"anthropic:default","narrative":"This column is a text description field for archaeological or heritage site records, containing short labels or names of megalithic structures (e.g., 'J\u00e6ttestue', 'Gro\u00dfsteingrab', 'Dolmen', 'Stone circle') in multiple languages including Danish, German, Portuguese, and English. The most striking signal is that 95.8% of the 15,464 rows (14,814) carry an empty string, effectively making the field near-empty at scale. The remaining 586 distinct non-empty values are heavily long-tailed, with the most frequent non-empty value ('J\u00e6ttestue') appearing only 11 times. The entropy ratio of 0.069 confirms extreme imbalance driven by the dominant empty-string value.","role":"free_text","scope":"column","target":"description","treatment":"Treat empty strings as missing; for non-null values, consider as a sparse categorical label or tokenize and embed for similarity/search use cases."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","cardinality","entropy","null_rate","n","top_values","alerts"],"model":"anthropic:default","narrative":"This column captures the construction or surface material of a physical feature (likely a wall, path, or structure in a geospatial dataset), with 13 distinct values across 15,464 rows. The dominant 'value' is an empty string, accounting for 98.44% of all records \u2014 meaning the field is effectively unpopulated for the vast majority of entries, despite a null_rate of 0.0. 
The remaining 241 non-empty records span stone-type materials (stone, granite, sandstone, limestone, etc.), with a minor language inconsistency ('Quarzit' appearing in German). Entropy is extremely low (0.133) confirming near-total dominance of the blank value.","role":"feature","scope":"column","target":"material","treatment":"Treat empty string as missing; recode to NaN, then consider a binary 'has_material' flag or impute/drop depending on task, given 98.44% missingness."},{"confidence":"high","critiques":[],"evidence_keys":["top_rate","top_value","n","n_unique","null_rate","entropy","top_values","alerts"],"model":"anthropic:default","narrative":"This column is intended to capture a start date for records, but it is overwhelmingly empty: 15,430 of 15,464 rows (99.78%) contain a blank string, making it nearly useless as a feature. The 34 non-empty values are highly heterogeneous \u2014 mixing ISO dates ('2004-07-01'), calendar years ('1999'), approximate historical dates ('~2000 BC'), ranges ('between 3500 and 2800 BCE'), negative year offsets ('-3000 BC'), and even a code-like value ('C-30') \u2014 indicating no enforced format or schema. The extreme imbalance (top_rate 0.998) and near-zero entropy (0.032) confirm the column carries almost no information signal.","role":"metadata","scope":"column","target":"start_date","treatment":"Drop from modelling due to 99.78% blank rate; if historical context is needed, parse and normalise the 34 non-blank values manually before any use."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","n_unique","entropy_ratio","n","null_rate"],"model":"anthropic:default","narrative":"This column classifies archaeological monument types, with 19 distinct categories across 15,464 records and no nulls. It is severely imbalanced: 'megalith' dominates at 97.73% of all records (15,113), leaving the remaining 18 types \u2014 menhir, dolmen, standing_stone, stone_circle, nuraghe, etc. \u2014 sharing just 351 records. 
The entropy ratio of 0.049 confirms near-total concentration in one class, which will severely impair any multi-class model trained on this label.","role":"label","scope":"column","target":"type","treatment":"Treat as a severely imbalanced categorical label; apply oversampling (SMOTE) or class-weighted losses if used as a target, or collapse rare types into an 'other' bucket for feature use."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","q1","q3","iqr","skew","kurtosis","n_outliers","outlier_rate","n_unique","n","null_rate"],"model":"anthropic:default","narrative":"This column contains geographic latitude values, ranging from -51.81\u00b0 to 65.17\u00b0, almost certainly representing the latitude coordinate of geolocated records. The vast majority of values cluster in the 43\u00b0\u201351\u00b0 band (IQR of ~7.6\u00b0), suggesting heavy concentration in mid-latitude Europe or North America. The negative skew of -3.09 and extreme kurtosis of 26.33 indicate a sharp central peak with a long left tail \u2014 a surprising number of records pull toward lower or even southern-hemisphere latitudes, captured in 134 flagged outliers (~0.87%). Near-uniqueness (15,320 unique out of 15,464 rows) is expected for precise coordinate data.","role":"feature","scope":"column","target":"lat","treatment":"Use as-is or pair with longitude for spatial analysis; investigate the 134 outliers for data-entry errors or genuine remote locations before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","kurtosis","iqr","q1","q3","n_outliers","outlier_rate","alerts"],"model":"anthropic:default","narrative":"This column represents geographic longitude values, with readings spanning from -151.36 to 144.74 degrees \u2014 a plausible global range. 
What is surprising is the severe positive skew (3.65) and extreme kurtosis (34.34), indicating the distribution is heavily concentrated in a narrow band (IQR of only 11.53, centred around Western Europe/Africa longitudes near 0\u00b0) with 676 outliers (4.37%) pulled far to the east and west. The mean (2.62) and median (-1.62) diverge noticeably, confirming the asymmetric clustering, likely reflecting a dataset dominated by European locations with a long tail of global outliers.","role":"feature","scope":"column","target":"lon","treatment":"Retain as-is for geo-spatial modelling; investigate and potentially stratify or cap the 676 outlier records before distance-based or regression analyses."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.skew","stats.iqr","stats.n_outliers"],"model":"anthropic:default","narrative":"This column is a numeric row identifier \u2014 every one of the 15,464 rows carries a distinct value with zero nulls, confirming it functions as a unique primary key. The values are large integers spanning roughly 24 million to 13.5 billion, which is consistent with a distributed-system or database auto-increment ID rather than a sequential integer index. Mild positive skew (0.89) and a wide IQR (~4.5 billion) suggest IDs were assigned non-uniformly over time or across sources, but no outliers are flagged.","role":"identifier","scope":"column","target":"id","treatment":"Retain as a join/lookup key; exclude from any feature matrix or model input."},{"confidence":"medium","critiques":[],"evidence_keys":["top_value","top_rate","n_unique","null_rate","top_values","cardinality"],"model":"anthropic:default","narrative":"This column represents a heritage classification or designation status for records, likely a regulatory or cultural heritage grading field. 
The dominant 'value' is an empty string, which accounts for 87.96% of all 15,464 rows, indicating that most records carry no heritage designation. The remaining values are a heterogeneous mix of numeric grades (1\u20134, 6, 7), boolean-style strings ('yes', 'no'), a Portuguese classification phrase ('Em Vias de Classifica\u00e7\u00e3o'), and single 'Scheduled Monument' and 'M0021' entries \u2014 suggesting the column was populated from multiple source systems or locales with no enforced vocabulary.","role":"label","scope":"column","target":"heritage","treatment":"Treat empty strings as a distinct 'undesignated' category; harmonise numeric grades, boolean strings, and foreign-language values into a unified controlled vocabulary before encoding."},{"confidence":"high","critiques":[],"evidence_keys":["top_value","top_rate","n_unique","cardinality","entropy_ratio","top_values","null_rate"],"model":"anthropic:default","narrative":"This column identifies the heritage operator or authority responsible for a record, with 31 distinct coded values across 15,464 rows. The dominant 'value' is an empty string, accounting for 89.5% of all rows (13,848), meaning the vast majority of records have no operator assigned \u2014 this blank dominance severely suppresses the entropy ratio to 0.14. 
Among the 30 non-empty values, 'mhs' (960), 'IE:smr' (229), and 'dgpc' (185) are the most common, suggesting a mix of abbreviated authority codes and occasional full names (e.g., 'Historic Environment Scotland'), indicating inconsistent formatting across sources.","role":"label","scope":"column","target":"heritage_operator","treatment":"Treat empty string as missing; normalise authority codes to a consistent controlled vocabulary before using as a categorical feature or grouping key."},{"confidence":"high","critiques":[],"evidence_keys":["top_values","top_rate","n_unique","null_rate","entropy_ratio","n"],"model":"anthropic:default","narrative":"This column classifies prehistoric stone monuments into structural types, with 73 distinct categories across 15,464 records and no nulls. The dominant class is 'menhir' (5,231 records, ~33.8%), followed closely by 'dolmen' (4,501), meaning these two types together account for over 60% of all rows \u2014 a moderate concentration reflected in an entropy ratio of 0.44. Notably, the third most frequent value is an empty string ('') with 1,714 occurrences (~11.1%), which masquerades as a non-null entry and represents a meaningful data quality issue that null_rate alone does not capture.","role":"label","scope":"column","target":"megalith_type","treatment":"Recode empty-string entries as explicit nulls or an 'unknown' category, then one-hot or target-encode for modelling given 73 categories and moderate class imbalance."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","top_value","top_rate","top_values","entropy"],"model":"anthropic:default","narrative":"This column encodes the OpenStreetMap geometry type, distinguishing between point features ('node') and linear/polygon features ('way'). With only 2 distinct values across 15,464 rows and zero nulls, it is a clean binary flag. The distribution is heavily skewed: 'node' dominates at 86.1% (13,311 records) versus 'way' at just 13.9% (2,153 records). 
The low entropy of 0.582 confirms the imbalance, which may matter if 'way' features behave differently in downstream models.","role":"feature","scope":"column","target":"osm_type","treatment":"Binary-encode (node=1, way=0) and monitor class imbalance if used as a feature or stratification variable."}],"providers":["anthropic:default"],"total_usage":{"completion_tokens":4619,"prompt_tokens":15604,"total_tokens":20223}},"language_counts":{},"meta":{"generated_at":"2026-06-22T00:36:07+00:00","mode":"full","row_count":15464,"sampled_rows":15464,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/quirky/megaliths.json"},"notes":[],"saturn_version":"0.2.0","schema":{"description":"categorical","heritage":"categorical","heritage_operator":"categorical","id":"numeric","lat":"numeric","lon":"numeric","material":"categorical","megalith_type":"categorical","name":"text","osm_type":"categorical","start_date":"categorical","type":"categorical","wikidata":"text","wikipedia":"text"}}
