{"columns":[{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"allcaps","level":"info","message":"100.0% rows are all-caps"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"}],"column":"PeopleID3ROG3","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[6.5,6.525,6.55,6.575,6.6,6.625,6.65,6.675,6.7,6.725,6.75,6.775,6.8,6.825,6.85,6.875,6.9,6.925,6.95,6.975,7.0,7.025,7.05,7.075,7.1,7.125,7.15,7.175,7.2,7.225,7.25,7.275,7.3,7.325,7.35,7.375,7.4,7.425,7.45,7.475,7.5]},"near_unique":true,"sample":["10375CE","21769IN","14244NI","10824PU","16828IN","18274LY","17080NP","22370NI","10949CM","13819NO","19198BT","17745IN","18615CH","10376MU","19808CH","21571BR","10161US","11988SU","19007KG","16620IN","11478BT","13922AG","12347UK","11317FR","21128IN","22047PK","17937IN","10584RP","12054CA","18274TU","20032PK","20236IN","20235PK","16501IN","16278IN","16944BG","20610CH","17590PK","17067IN","17721IN","10391SU","18628CH","18577CH","18617CH","14039MG","20631GG","15382GM","16514NP","10839AJ","16100BN"],"top_values":[],"top_words":[["10208ng",1],["10301su",1],["10375tz",1],["10375up",1],["10376ae",1],["10376ca",1],["10375as",1],["10375bu",1],["10375ce",1],["10375cg",1],["10375gb",1],["10375hu",1],["10375id",1],["10375ke",1],["10375mk",1],["10375my",1],["10375pk",1],["10375rp",1],["10375sl",1],["10375so",1],["10376eg",1],["10376ir",1],["10376iz",1],["10376ku",1],["10376mu",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.966666666
6666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":7124,"null_rate":0.0,"stats":{"allcaps_rate":1.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":7,"len_mean":7.0,"len_median":7.0,"len_min":7,"len_p95":7.0,"n_duplicates":0,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":112.33700000000003,"url_rate":0.0,"vocab_size":7124,"word_mean":1.0,"word_median":1.0}},{"alerts":[],"column":"ROG3","extras":{"singletons":35,"top_values":[["IN",2032],["PK",767],["CH",442],["BG",256],["ID",234],["NP",184],["SU",168],["LA",142],["RS",115],["US",90],["IR",85],["CD",81],["MY",78],["TH",73],["VM",69],["TU",61],["BM",59],["AF",58],["CE",55],["CA",52]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":202,"null_rate":0.0,"stats":{"cardinality":202,"entropy":5.058444860597964,"entropy_ratio":0.660525616456381,"top_rate":0.2852330151600225,"top_value":"IN"}},{"alerts":[],"column":"PeopleID3","extras":{"histogram":{"counts":[131,123,167,106,123,108,168,196,140,128,131,93,71,212,96,178,223,170,53,233,231,221,238,314,274,255,272,236,278,164,160,174,205,92,106,254,189,115,295,201],"edges":[10120.0,10433.525,10747.05,11060.575,11374.1,11687.625,12001.15,12314.675,12628.2,12941.725,13255.25,13568.775,13882.3,14195.825,14509.349999999999,14822.875,15136.4,15449.925,15763.45,16076.974999999999,16390.5,16704.025,17017.55,17331.075,17644.6,17958.125,18271.65,18585.175,18898.699999999997,19212.225,19525.75,19839.275,20152.8,20466.324999999997,20779.85,21093.375,21406.9,21720.425,22033.949999999997,22347.475,22661.0]},"sample":[10378.0,10379.0,10379.0,10572.0,11197.0,12029.0,12065.0,12247.0,12247.0,12247.0,12368.0,12368.0,13169.0,13483.0,13819.0,13819.0,13842.0,14639.0,14715.0,14911.0,14911.0,15484.0,15946.0,20327.0,20593.0,22659.0,12145.0,12322.0,1
2322.0,18398.0,18425.0,18557.0,18606.0,18648.0,18705.0,20515.0,20625.0,10161.0,10495.0,10953.0,10953.0,10953.0,11317.0,12952.0,13049.0,18765.0,18765.0,18997.0,21310.0,21363.0,14883.0,14983.0,14983.0,19603.0,19651.0,21539.0,21548.0,21842.0,10591.0,11126.0,12877.0,12877.0,12877.0,12877.0,12877.0,14322.0,14324.0,14371.0,14371.0,14461.0,15201.0,15220.0,15866.0,18693.0,18858.0,20455.0,20542.0,11661.0,11764.0,12346.0,12350.0,12374.0,14451.0,16021.0,16067.0,19247.0,20824.0,21846.0,11402.0,12166.0,18869.0,19143.0,19323.0,21613.0,21650.0,10140.0,10795.0,10933.0,11837.0,12318.0,12602.0,12680.0,13437.0,14465.0,14511.0,15335.0,15956.0,19029.0,19545.0,19812.0,20295.0,12868.0,10243.0,10419.0,11277.0,11277.0,13705.0,14061.0,14377.0,14586.0,15192.0,15194.0,15205.0,15361.0,15460.0,16028.0,18466.0,18486.0,18566.0,18589.0,18682.0,18690.0,18888.0,19578.0,19592.0,19799.0,19808.0,21066.0,21646.0,22602.0,22607.0,22614.0,22615.0,22618.0,10790.0,10790.0,11595.0,11982.0,11982.0,12027.0,12329.0,12410.0,12486.0,12558.0,12771.0,13317.0,13317.0,13317.0,14042.0,14196.0,14300.0,14327.0,14483.0,14483.0,14732.0,15034.0,15498.0,15727.0,16162.0,16172.0,16187.0,16217.0,16243.0,16307.0,16313.0,16325.0,16332.0,16338.0,16404.0,16406.0,16419.0,16496.0,16518.0,16521.0,16538.0,16585.0,16643.0,16665.0,16684.0,16703.0,16725.0,16742.0,16750.0,16755.0,16757.0,16762.0,16771.0,16779.0,16799.0,16808.0,16811.0,16839.0,16848.0,16902.0,16904.0,16905.0,16922.0,16924.0,16934.0,16940.0,16947.0,16960.0,16973.0,17080.0,17010.0,17035.0,17039.0,17041.0,17061.0,17066.0,17105.0,17110.0,17124.0,17131.0,17158.0,17238.0,17251.0,17268.0,17301.0,17314.0,17316.0,17352.0,17379.0,17381.0,17391.0,17400.0,17407.0,17417.0,17418.0,17419.0,17432.0,17463.0,17510.0,17520.0,17527.0,17538.0,17571.0,17584.0,17590.0,17597.0,17620.0,17622.0,17639.0,17672.0,17684.0,17707.0,17735.0,17740.0,17743.0,17744.0,17755.0,17763.0,17767.0,17770.0,17778.0,17786.0,17824.0,17840.0,17843.0,17853.0,17858.0,17877.0,17903.0,17961.0,17993.0,18012.0,18046.0,18054.0,1
8061.0,18104.0,18140.0,18144.0,18165.0,18216.0,18305.0,18309.0,18327.0,18332.0,18337.0,18795.0,19069.0,19082.0,19194.0,19199.0,19211.0,19211.0,19211.0,19211.0,19268.0,19279.0,19655.0,19688.0,19724.0,19779.0,19821.0,19825.0,19825.0,19839.0,19858.0,19859.0,19899.0,19931.0,19937.0,19949.0,19956.0,19965.0,19974.0,19987.0,20000.0,20006.0,20013.0,20057.0,20209.0,20211.0,20218.0,20232.0,20238.0,20252.0,20344.0,20346.0,20373.0,20387.0,20394.0,20401.0,20442.0,21122.0,20982.0,21015.0,21025.0,21035.0,21105.0,21114.0,21139.0,21149.0,21216.0,21226.0,21238.0,21239.0,21255.0,21259.0,21317.0,21329.0,21356.0,21371.0,21398.0,21477.0,21479.0,21485.0,21487.0,21496.0,21499.0,21500.0,21518.0,21519.0,21535.0,21537.0,21587.0,21622.0,21703.0,21711.0,21725.0,21730.0,21737.0,21747.0,21772.0,21788.0,21806.0,21810.0,21812.0,21813.0,21816.0,21825.0,22052.0,22085.0,22086.0,22096.0,22143.0,22156.0,22165.0,22189.0,22194.0,22199.0,22205.0,22206.0,22208.0,22219.0,22241.0,22267.0,22276.0,22282.0,22302.0,22339.0,22348.0,22350.0,22443.0,22448.0,22492.0,10386.0,10617.0,10636.0,10976.0,11189.0,11292.0,11533.0,11588.0,11884.0,11925.0,12509.0,12711.0,13230.0,13511.0,13844.0,14355.0,14996.0,14996.0,15014.0,15145.0,15145.0,15161.0,15277.0,15365.0,15411.0,15414.0,15530.0,15626.0,18862.0,18907.0,21008.0,22357.0,22466.0,15468.0,15468.0,16151.0,18462.0,18599.0,18515.0,18535.0,18536.0,18555.0,18576.0,18640.0,18652.0,18655.0,18671.0,18684.0,18688.0,18731.0,18886.0,18886.0,19250.0,20613.0,20945.0,10205.0,10528.0,12599.0,12599.0,12933.0,13962.0,13962.0,14409.0,14498.0,15070.0,15284.0,15668.0,15755.0,15755.0,15755.0,18274.0,18389.0,18736.0,18721.0,21654.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0,19007.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":4614,"null_rate":0.0,"stats":{"iqr":5250.75,"kurtosis":-0.9527844427376593,"max":22661.0,"mean":16933.848680516563,"median":17356.5,"min":10120.0,"n_outliers":0,"outlier_rate"
:0.0,"q1":14328.5,"q3":19579.25,"skew":-0.22552586229683574,"std":3430.7695606125712,"zero_rate":0.0}},{"alerts":[],"column":"ROP3","extras":{"histogram":{"counts":[133,97,107,139,94,89,86,153,155,105,89,137,141,102,66,79,162,100,83,263,152,111,127,342,277,300,418,364,340,169,324,236,360,71,72,39,263,332,67,373],"edges":[100005.0,100495.35,100985.7,101476.05,101966.4,102456.75,102947.1,103437.45,103927.8,104418.15,104908.5,105398.85,105889.2,106379.55,106869.9,107360.25,107850.6,108340.95,108831.3,109321.65,109812.0,110302.35,110792.7,111283.05,111773.4,112263.75,112754.1,113244.45,113734.8,114225.15,114715.5,115205.85,115696.2,116186.55,116676.9,117167.25,117657.6,118147.95,118638.3,119128.65,119619.0]},"sample":[100431.0,100226.0,100226.0,100772.0,103010.0,103630.0,103715.0,104056.0,104056.0,104056.0,104301.0,104301.0,105948.0,106221.0,106804.0,106804.0,106837.0,108512.0,108627.0,108942.0,108945.0,110053.0,110474.0,116046.0,116912.0,117090.0,103902.0,104189.0,104189.0,114832.0,114020.0,114174.0,114226.0,114269.0,114350.0,116330.0,116867.0,100079.0,100852.0,101629.0,101629.0,101629.0,102059.0,105583.0,105742.0,114431.0,114431.0,115399.0,118146.0,118183.0,109392.0,109392.0,109392.0,108538.0,115403.0,118347.0,118358.0,119008.0,113266.0,101922.0,105458.0,105458.0,105458.0,105458.0,105458.0,107901.0,107906.0,107987.0,107987.0,108647.0,109733.0,109766.0,110917.0,103535.0,114716.0,116305.0,116135.0,103063.0,103299.0,117322.0,104313.0,104318.0,108133.0,111108.0,111222.0,104314.0,118621.0,119603.0,102327.0,105247.0,114896.0,114985.0,115242.0,118405.0,110988.0,100036.0,115051.0,101679.0,103309.0,104156.0,104863.0,105020.0,106144.0,108173.0,108294.0,109949.0,112316.0,115257.0,108799.0,116015.0,106070.0,105528.0,100487.0,100487.0,101940.0,101940.0,106686.0,107510.0,107515.0,108011.0,108436.0,109720.0,109722.0,109758.0,110776.0,109994.0,111090.0,114075.0,114096.0,114183.0,114209.0,109710.0,114321.0,114836.0,115091.0,115224.0,114998.0,108601.0,106270.0,118428.0,119578.0,119518.
0,119536.0,119545.0,119537.0,101254.0,101254.0,102831.0,103544.0,103544.0,103789.0,104555.0,104555.0,104555.0,104795.0,105243.0,107204.0,107217.0,107217.0,109027.0,109305.0,109502.0,108182.0,108182.0,108182.0,108730.0,109523.0,110423.0,110423.0,111274.0,111277.0,111292.0,111334.0,111372.0,111442.0,111445.0,111463.0,111469.0,111477.0,111553.0,111556.0,111573.0,111671.0,111696.0,111700.0,111726.0,111783.0,111857.0,111883.0,111919.0,111941.0,111968.0,111989.0,111999.0,112006.0,112009.0,112021.0,112034.0,112044.0,112063.0,112065.0,112074.0,112082.0,112124.0,112132.0,112198.0,112199.0,112202.0,112222.0,112226.0,112242.0,112247.0,112254.0,112271.0,112288.0,112418.0,112339.0,112373.0,112377.0,112379.0,112403.0,112404.0,112450.0,112451.0,112457.0,112470.0,112488.0,112509.0,112608.0,112628.0,112639.0,112680.0,112696.0,112698.0,112740.0,112774.0,112781.0,112789.0,112801.0,112808.0,112819.0,112820.0,112820.0,112835.0,112873.0,112926.0,112941.0,112949.0,112963.0,112998.0,113015.0,113020.0,113030.0,113057.0,113057.0,113075.0,113116.0,113131.0,113158.0,113194.0,113199.0,113203.0,113215.0,113224.0,113229.0,113235.0,113245.0,113254.0,113298.0,113314.0,113318.0,113330.0,113335.0,113354.0,113384.0,113451.0,113486.0,113507.0,113546.0,113553.0,113561.0,113608.0,113651.0,113653.0,113677.0,113743.0,113852.0,113855.0,113879.0,113882.0,113884.0,113889.0,114488.0,115336.0,111279.0,113801.0,115528.0,115527.0,115527.0,115527.0,115527.0,115325.0,115550.0,112187.0,115140.0,115177.0,115849.0,115859.0,115860.0,115869.0,115873.0,115874.0,115893.0,115701.0,115711.0,115725.0,115732.0,115742.0,115755.0,115772.0,115910.0,115915.0,115921.0,115767.0,115966.0,115702.0,115748.0,115976.0,115982.0,100894.0,116127.0,116130.0,116157.0,116171.0,116178.0,116185.0,116225.0,117945.0,117706.0,117866.0,117876.0,117885.0,117928.0,117937.0,117961.0,117972.0,118038.0,118048.0,118061.0,118062.0,118078.0,118081.0,118151.0,118155.0,118180.0,118182.0,118203.0,118293.0,118295.0,115212.0,118304.0,118320.0,117184.0,118329.0,
118321.0,118338.0,116298.0,117687.0,118414.0,118490.0,118499.0,118512.0,118517.0,118523.0,118534.0,118559.0,118575.0,118593.0,118596.0,118597.0,118598.0,118600.0,118602.0,118610.0,119066.0,119095.0,119096.0,119106.0,119160.0,119173.0,119182.0,119206.0,119212.0,119216.0,119222.0,119223.0,119225.0,119237.0,119259.0,119285.0,119295.0,119301.0,119114.0,112887.0,119347.0,119349.0,119425.0,117670.0,111658.0,100437.0,100925.0,100925.0,101648.0,101820.0,101970.0,102513.0,102625.0,103311.0,103420.0,104604.0,105010.0,106010.0,106266.0,106841.0,107773.0,109404.0,109413.0,109426.0,109644.0,109644.0,109644.0,109768.0,110780.0,110786.0,110856.0,110075.0,110257.0,114613.0,114850.0,117720.0,118453.0,119445.0,110033.0,110033.0,111073.0,114063.0,114162.0,114124.0,114151.0,114157.0,114191.0,114194.0,114259.0,114258.0,114274.0,114295.0,114305.0,114313.0,114363.0,114381.0,114830.0,115322.0,116905.0,116911.0,119541.0,100675.0,104791.0,104791.0,105403.0,107064.0,107376.0,107686.0,108219.0,109520.0,109874.0,110306.0,110469.0,113818.0,113818.0,113982.0,114302.0,114344.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0,114916.0]},"kind":"numeric","n":7124,"n_null":7,"n_unique":4608,"null_rate":0.0009825940482874789,"stats":{"iqr":7339.0,"kurtosis":-0.7272864543722006,"max":119619.0,"mean":111443.67542503864,"median":112533.0,"min":100005.0,"n_outliers":0,"outlier_rate":0.0,"q1":107901.0,"q3":115240.0,"skew":-0.47119464533262295,"std":5268.681648676187,"zero_rate":0.0}},{"alerts":[{"code":"one_word","level":"warn","message":"45.7% rows are a single word"},{"code":"duplicates","level":"warn","message":"33.7% duplicate 
strings"}],"column":"PeopNameInCountry","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1,14,101,557,661,692,665,370,202,210,277,290,329,434,330,282,175,118,67,0,87,56,65,103,195,209,192,111,69,57,37,46,45,33,22,18,1,0,1,2],"edges":[1.0,1.95,2.9,3.8499999999999996,4.8,5.75,6.699999999999999,7.6499999999999995,8.6,9.549999999999999,10.5,11.45,12.399999999999999,13.35,14.299999999999999,15.25,16.2,17.15,18.099999999999998,19.05,20.0,20.95,21.9,22.849999999999998,23.799999999999997,24.75,25.7,26.65,27.599999999999998,28.549999999999997,29.5,30.45,31.4,32.349999999999994,33.3,34.25,35.199999999999996,36.15,37.1,38.05,39.0]},"near_unique":false,"sample":["Arab","Mansoori","Pa'a, Afawa","Biafada","Ghosi (Hindu traditions)","Turk","Kandu","Tulai","Fulani, Nigerian","Arab, Moroccan","Walang","Nai (Hindu traditions)","Mulao Jia","Arab, Arabic Gulf Spoken","Zhuang, Guibian","Kulina Pano","Adyghe","Gulud","Deaf","Chunvalia","Dakpa","Bedouin, Nail","Jewish, English-speaking","Chechen","Darzi Mathuria (Muslim traditions)","Baloch Qaisrani","Ramdasia (Hindu traditions)","Jama Mapun, Bajau Kagayan","Han Chinese, Hakka","Turk","Jat Autrah","Rajput Garewal (Muslim traditions)","Rajput Chauhan (Muslim traditions)","Bolodia","Badwa","Ho","Phuma","Khumra (Muslim traditions)","Kamboh (Hindu traditions)","Vaddar (Muslim traditions)","Temein, Arabized","Nasu, Southern","Miao, Baishi","Naheng","Uzbek, Northern","Turk, Meskhetian","Punjabi, Western","Bote-Majhi","Jewish Tat, Mountain Jewish","Zarma"],"top_values":[["Deaf",151],["Turk",38],["Persian",36],["Japanese",34],["South Asian, general",34],["Kurd, Kurmanji",27],["Thai",27],["Arab, Moroccan",25],["Somali",25],["Arab, Sudanese",23],["Urdu",23],["Malay",21],["Nepali, general",21],["Afghani, general",21],["Bosniak",20],["Gujarati",19],["Algerian, Arabic-speaking",18],["Arab, Iraqi",18],["Punjabi",18],["South Asian, 
Bengali-speaking",17]],"top_words":[["traditions)",977],["(hindu",487],["(muslim",421],["pashtun",239],["jat",232],["arab,",220],["rajput",208],["deaf",151],["brahmin",126],["jewish,",116],["general",96],["bania",74],["south",65],["(sikh",63],["berber,",61],["asian,",59],["baloch",54],["khel",52],["tai",50],["northern",49],["western",49],["turk",47],["southern",46],["persian",38],["kurd,",37]],"vocab_skipped":null,"word_histogram":{"counts":[3259,0,0,0,0,0,0,2462,0,0,0,0,0,0,0,1095,0,0,0,0,0,0,297,0,0,0,0,0,0,11],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":4722,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.3371701291409321,"emoji_rate":0.0,"len_max":39,"len_mean":12.50042111173498,"len_median":11.0,"len_min":1,"len_p95":27.0,"n_duplicates":2402,"n_empty":0,"one_word_rate":0.45746771476698483,"readability_flesch_mean":56.379325000000016,"url_rate":0.0,"vocab_size":4602,"word_mean":1.784250421111735,"word_median":2.0}},{"alerts":[],"column":"ROG2","extras":{"singletons":0,"top_values":[["ASI",5351],["AFR",986],["EUR",431],["NAR",175],["LAM",106],["AUS",39],["SOP",36]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"cardinality":7,"entropy":1.2511950244229526,"entropy_ratio":0.44568466017325303,"top_rate":0.7511229646266142,"top_value":"ASI"}},{"alerts":[],"column":"Continent","extras":{"singletons":0,"top_values":[["Asia",5351],["Africa",986],["Europe",431],["North America",175],["South 
America",106],["Australia",39],["Oceania",36]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"cardinality":7,"entropy":1.2511950244229526,"entropy_ratio":0.44568466017325303,"top_rate":0.7511229646266142,"top_value":"Asia"}},{"alerts":[],"column":"RegionName","extras":{"singletons":0,"top_values":[["Asia, South",3349],["Asia, Southeast",726],["Asia, Northeast",521],["Africa, West and Central",460],["Africa, North and Middle East",444],["Africa, East and Southern",373],["Asia, Central",352],["Europe, Western",320],["Europe, Eastern and Eurasia",223],["America, North and Caribbean",160],["America, Latin",121],["Australia and Pacific",75]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":12,"null_rate":0.0,"stats":{"cardinality":12,"entropy":2.715172154839157,"entropy_ratio":0.7573781188207601,"top_rate":0.4701010668163953,"top_value":"Asia, South"}},{"alerts":[],"column":"ISO3","extras":{"singletons":35,"top_values":[["IND",2032],["PAK",767],["CHN",442],["BGD",256],["IDN",234],["NPL",184],["SDN",168],["LAO",142],["RUS",115],["USA",90],["IRN",85],["TCD",81],["MYS",78],["THA",73],["VNM",69],["TUR",61],["MMR",59],["AFG",58],["LKA",55],["CAN",52]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":202,"null_rate":0.0,"stats":{"cardinality":202,"entropy":5.058444860597964,"entropy_ratio":0.660525616456381,"top_rate":0.2852330151600225,"top_value":"IND"}},{"alerts":[{"code":"multilingual","level":"info","message":"11 languages detected in sample"},{"code":"null_rate","level":"warn","message":"64.2% 
null"}],"column":"LocationInCountry","extras":{"language_counts":{"__engine":"fasttext:1,729","ceb":1,"de":4,"en":1714,"eo":2,"es":1,"id":1,"ilo":1,"it":2,"min":1,"pt":2},"language_sample_size":5000,"length_histogram":{"counts":[327,413,323,303,234,153,116,84,75,48,55,46,42,46,33,31,19,24,40,17,19,12,10,14,10,10,11,7,4,2,3,4,7,1,1,1,1,0,1,1],"edges":[3.0,26.4,49.8,73.19999999999999,96.6,120.0,143.39999999999998,166.79999999999998,190.2,213.6,237.0,260.4,283.79999999999995,307.2,330.59999999999997,354.0,377.4,400.79999999999995,424.2,447.59999999999997,471.0,494.4,517.8,541.1999999999999,564.5999999999999,588.0,611.4,634.8,658.1999999999999,681.5999999999999,705.0,728.4,751.8,775.1999999999999,798.5999999999999,822.0,845.4,868.8,892.1999999999999,915.5999999999999,939.0]},"near_unique":false,"sample":["Gulf Bedu or village peoples","Widespread. Formerly Zanzibar, coastal areas.","A 1987 linguistic study listed 91,000 speakers of the Northern Khampa Tibetan language. They occupy the large, sparsely populated Yushu Tibetan Autonomous Prefecture in southern Qinghai Province. Northern Khampa is spoken as far north as the 5,214-meter-high (17,100 ft.) Mount Yagradagze. In addition, a small number of Northern Khampa spill over the border into northeast Tibet. 
The nomadic Northern Khampa live on a high plateau where they herd sheep, goats, and yaks.","Janub Darfur State, Daju hills 40 km northeast of Nyala; Gharb Darfur state: Geneina district; Lagowa dialect: Janub Kurdufan state: Lagawa, Dar el Kabira (Kidong), Silecce, Warina, Jebel Miheila, Nyukri, and Tamanyik area villages.","Nan province: Bo Kluea district, Laos-Thailand border.","Siberia, most in Sakha (Yakutiya), and Krasnoyarskiy Kray; also in Irkutskaya Oblast\u2019, Buryatiya, Zabaykalsky, and Amurskaya Oblast\u2019; Pacific coast settlements, Magadanskaya Oblast\u2019, Chukotskiy Avtonomnyy Okrug, Khabarovskiy Kray, Kamchatka, and Sakhalinskaya Oblast\u2019.","Phongali and Oudomxai provinces, Samphan and Namo districts.","The Boyu Tibetans live in the large Boyu Village in Zhugqu County. Zhugqu is within the Gaanan Prefecture in poverty-stricken Gansu Province. They live atop a 3,000- meter-high (9,840 ft.) mountain. \"Boyu is located at the heart of a complex of high peaks and deep ravines, and the paths along which they climb lead through magnificent scenery\u2026 dotted with all kinds of flowers: azaleas, camellias, peonies, wolf-berries.\"","Upper portion of Tana river","Agadez region: Bilma north from N\u2019guigmi to Libya border; Diffa region; Zinder region: Goure department.","New York (Queens), Washington D.C., Detroit, Houston, Philadelphia, Atlanta, Los Angeles","Yunnan province: Honghe and Yi autonomous prefectures, Jinping Miao-Yao-Dai autonomous county, Mengla district, Manzhang-Shangzhai and Mangzhang-Xiazhai villages.","States of Selangor and Perak","Az Zahirah and Al Batinah governorates.","Mindanao, Sultan Kudarat Province, Kalamansig, Palimbang, and Ninoy Aquino municipalities; South Cotabato Province, T\u2019Boli municipality.","Hormozg\u0101n: Qeshm, Shah\u0101b, L\u0101rak, L\u0101rak Shahri. Spoken in a single town in Iran.","There is no single cohesive Japanese community or village in China. 
They are scattered throughout towns and villages in what was formerly called Manchuria, now the northeastern Chinese provinces of Heilongjiang, Jilin, and Liaoning.","Shan state: Taunggyi district, Kalaw, and Pinlong townships.","Scattered.","East Savannahkhet Province, Sepone district; southeast Khammouan Province, Boulapha district.","Sumatera Selatan Province, Ogan Komering Ulu Selatan, Ogan Komering Ulu Timur, Ogan Komering Ulu, and Ogan Ilir regencies; separate areas along Komering river from Ranaumeer to near Palembang city.","Widespread.","Shabeellaha Hoose and Jubbada Dhexe regions: Dhiinsoor, Baraawe, and Jilib districts; Bay and Jubbada Hoose regions.","Kagoshima Prefecture, north central Okinawa, Yoron island.","Janub Kurdufan state: Keiga Jirru, and 6 villages northeast of Kadugli.","Janub Kurdufan state: Tegali and Rashad hills and Rashad town.","Konar province: Konar river valley. 8 or 9 villages.","North near Caspian Sea, Mazandaran Province; some also in Semnan and Golestan provinces.","Primarily north","Buxoro, Jizzax, Navoiy, Qashqadaryo, Samarqand, and Sirdaryo provinces.","Donga department: Ouak\u00e9 commune, Semere town area.","Kebbi state: Argungu and Bagudo LGAs, on upper Niger river.","Widespread; eastern Syrian desert.","Chinese scholars in the 1990s discovered that Baheng speakers in southern Guizhou and northern Guangxi divided into two distinct language groups. The larger group was labeled Baheng, Sanjiang, while this smaller group (4,000 people) was named Baheng, Liping after the county which they primarily inhabit in Guizhou Province. 
Liping is home to several minorities, including the Mjuniang and the Dong.","Sarawak, Kapit Division, upper Rajom and Tatau rivers, Baleh.","Houaphan province, Xiangkho district","Nearly all in north Cyprus","Their communities spill into at least eight provinces (of central and western Thailand), including Phichit, Suphan Buri, Uthai Thani, Chai Nat, Phitsanulok, Kamphaeng Phet, Nakhon Pathom and Nakhon Sawan.","North Shan State; east Kachin State.","Guangxi Zhuang Autonomous Region: Lingui county, Guilin muncipality; Chadong district (most villages), Liangjiang township; Yongfu county, Longjiang district.","South Kordofan state: Abul and Heiban towns.","Phongsaly province, Khua, Samphan, Mai districts","Sulawesi Tengah Province, Parigi Moutong subdistrict, north peninsula, south coast, facing gulf of Tomini: Bolano village.","Oudomxay and Phongsaly provinces, Namo and Bountay districts","Provinces of Herat, Hazarajat, Balkh, Ghor, Ghazni, Budaksham, Panjsher; Galcha-Pamir Mountains; Kabul regions. Dari in Khorasan Province (Iran)","Approximately 10,000 Saragh (Western) Yugur live in the western part of the Sunan Yugur Autonomous County, in the narrow northern corridor of Gansu Province. The nearest town to the Saragh Yugur is Zhangye. Other Saragh Yugur communities are located in the Dahe and Minghua districts, and in the Huangnibao area near Jiuquan City in western Gansu.","Peninsular, Pahang, Terengganu, and Kelantan states.","Approximately 17,000 Bunuo people live in a small area within Du'an County in the western part of the Guangxi Zhuang Autonomous Region in southern China. Du'an is an isolated mountainous area on the road between Debao and Jingxi townships.","Kilifi, Lamu, and Tana River counties.","In 1983 Chinese linguist Sun Hongkai listed 5,000 speakers of the Namuyi language. The majority are located in the western parts of the Liangshan (Cold Mountains) Prefecture in southern Sichuan Province. 
Although small in number, the Namuyi are geographically widespread, inhabiting parts of Mianning, Muli, Xichang, and Yanyuan counties in the Liangshan Prefecture, in addition to parts of Jiulong County in Garze Prefecture."],"top_values":[["Widespread.",56],["Primarily north",46],["The Zhuang are the largest minority group in China. With more than 17 million people, their population is approximately the same as the population of Australia. More than 11 million people speak the various Zhuang languages. The majority are located in the central and western parts of Guangxi in southern China. Others are scattered throughout 15 of the other 29 provinces in China, including one small Zhuang enclave in distant Shaanxi Province.",14],["Widespread",12],["Widespread, especially in the north.",10],["Scattered.",10],["Sumatra island, Sumatera Selatan Province; east down Lematang and Ogan river valleys, south of Muaraenim town, east and southeast of Lahat town; Bengkulu Province; central Bukit Barisan highlands west to Indian Ocean along Bengkulu coast; Lampung Province, 4 separate enclaves.",10],["Widespread, especially north and central.",10],["Dagestan Republic.",9],["Widespread in Peninsular Malaysia; also in Sarawak state: Kuching, Samarahan, Sri Aman, and Betong districts.",9],["East and south central.",9],["Scattered",8],["Widespread. Formerly Zanzibar, coastal areas.",7],["Widespread, south of Atlas Mountains, including Sahara port cities.",7],["Sumatera Selatan Province, widespread in northern 2 thirds of province; Musi river upstream to Bukit Barisan mountains, downstream to eastern coastal swamplands; into northeast Lampung Province; a few small border areas in Jambi and Bengkulu provinces.",6],["Attapue province, Samakkhixay district",6],["Widespread in the Indonesian Archipelago; west central Sumatra, Padang area. 
Nearly half live outside central Sumatra; South Sumatra, west coast Mukomuko area",5],["Widespread throughout Indonesia; mainly in Jawa Tengah, Yogyakarta, Jawa Timur, and Lampung provinces; scattered enclaves on Sumatra island and resettlements in Papua, Sulawesi, Maluku, and Kalimantan.",5],["Southernmost Sumatra island, 3 provinces, many communities near or on Selat Sunda, west, central, and south Lampung Province, regencies: Lampung Barat and Tanggamus, southwest coast and coastline around Semangko bay, Way Kanan, Lampung Utara, and Pringsewu, inland, southeast tip, Lampung Selatan, east coast of Lampung bay and nearby islands Sebuku, Sebesi, Tabuan, and Legundi; Sumatera Selatan Province, Ogan Komering Ulu Selatan, Ogan Komering Ulu Timur, and Ogan Komering Ulu regencies, near headwaters of Kanan river; south Bengkulu Province, Kaur regency.",5],["Montreal",4]],"top_words":[["the",2270],["and",2177],["in",2066],["of",2016],["province,",497],["live",462],["to",415],["are",407],["a",368],["north",345],["region:",341],["south",317],["province.",297],["is",240],["east",210],["district",207],["west",202],["southern",202],["they",200],["area",199],["people",197],["yunnan",191],["province:",186],["river",184],["central",182]],"vocab_skipped":null,"word_histogram":{"counts":[719,468,412,210,129,88,61,92,49,42,42,28,31,49,17,25,15,10,11,10,16,5,3,3,4,2,3,0,2,2],"edges":[1.0,6.133333333333334,11.266666666666667,16.400000000000002,21.533333333333335,26.666666666666668,31.800000000000004,36.93333333333334,42.06666666666667,47.2,52.333333333333336,57.46666666666667,62.60000000000001,67.73333333333333,72.86666666666667,78.0,83.13333333333334,88.26666666666668,93.4,98.53333333333335,103.66666666666667,108.80000000000001,113.93333333333334,119.06666666666668,124.20000000000002,129.33333333333334,134.46666666666667,139.60000000000002,144.73333333333335,149.86666666666667,155.0]}},"kind":"text","n":7124,"n_null":4576,"n_unique":2176,"null_rate":0.6423357664233577,"stats":{"allca
ps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.14599686028257458,"emoji_rate":0.0,"len_max":939,"len_mean":141.07339089481945,"len_median":89.0,"len_min":3,"len_p95":455.6500000000001,"n_duplicates":372,"n_empty":0,"one_word_rate":0.04317111459968603,"readability_flesch_mean":41.644913898198155,"url_rate":0.0,"vocab_size":10936,"word_mean":21.145211930926216,"word_median":12.0}},{"alerts":[{"code":"outliers","level":"warn","message":"32.9% rows beyond 1.5 IQR"}],"column":"PeopleID1","extras":{"histogram":{"counts":[475,0,140,0,0,166,0,83,0,0,225,0,128,0,0,81,0,339,0,0,3,0,13,0,0,451,0,3681,0,0,632,0,287,0,0,269,0,0,0,151],"edges":[10.0,10.4,10.8,11.2,11.6,12.0,12.4,12.8,13.2,13.6,14.0,14.4,14.8,15.2,15.600000000000001,16.0,16.4,16.8,17.2,17.6,18.0,18.4,18.8,19.200000000000003,19.6,20.0,20.4,20.8,21.200000000000003,21.6,22.0,22.4,22.8,23.200000000000003,23.6,24.0,24.4,24.8,25.200000000000003,25.6,26.0]},"sample":[10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,12.0,13.0,13.0,13.0,13.0,13.0,13.0,13.0,13.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,15.0,15.0,15.0,15.0,15.0,15.0,15.0,15.0,15.0,15.0,15.0,16.0,16.0,16.0,16.0,16.0,16.0,16.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,17.0,19.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,2
1.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,22.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,23.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0,26.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":0.8321442942311568,"max":26.0,"mean":19.51137001684447,"median":21.0,"min":10.0,"n_outliers":2347,"outlier_rate":0.329449747332959,"q1":20.0,"q3":21.0,"skew":-1.3369368010443223,"std":3.8582579713808585,"zero_rate":0.0}},{"alerts":[],"column":"ROP1","extras":{"singletons":0,"top_values":[["A012",3681],["A013",632],["A001",475],["A011",451],["A008",339],["A014",287],["A015",269],["A005",225],["A003",166],["A017",151],["A002",140],["A006",128],["A004",83],["A007",8
1],["A010",13],["A009",3]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"cardinality":16,"entropy":2.6758432956930482,"entropy_ratio":0.6689608239232621,"top_rate":0.5167040988208872,"top_value":"A012"}},{"alerts":[],"column":"AffinityBloc","extras":{"singletons":0,"top_values":[["South Asian Peoples",3681],["Sub-Saharan Peoples",632],["Arab World",475],["Southeast Asian Peoples",451],["Malay Peoples",339],["Tibetan-Himalayan Peoples",287],["Turkic Peoples",269],["Persian-Median",225],["Eurasian Peoples",166],["Deaf",151],["East Asian Peoples",140],["Jewish",128],["Horn of Africa Peoples",83],["Latin-Caribbean Americans",81],["Pacific Islanders",13],["North American Peoples",3]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"cardinality":16,"entropy":2.6758432956930482,"entropy_ratio":0.6689608239232621,"top_rate":0.5167040988208872,"top_value":"South Asian Peoples"}},{"alerts":[],"column":"PeopleID2","extras":{"histogram":{"counts":[72,353,99,58,74,217,156,86,92,67,188,111,122,84,222,136,34,144,3,68,194,147,223,256,160,14,58,8,0,0,0,0,100,573,216,50,928,128,1136,547],"edges":[101.0,110.35,119.7,129.05,138.4,147.75,157.1,166.45,175.8,185.14999999999998,194.5,203.85,213.2,222.55,231.9,241.25,250.6,259.95,269.29999999999995,278.65,288.0,297.35,306.7,316.04999999999995,325.4,334.75,344.1,353.45,362.8,372.15,381.5,390.84999999999997,400.2,409.55,418.9,428.25,437.59999999999997,446.95,456.3,465.65,475.0]},"sample":[111.0,115.0,115.0,111.0,117.0,118.0,112.0,113.0,113.0,113.0,113.0,113.0,114.0,121.0,115.0,115.0,141.0,112.0,118.0,145.0,145.0,118.0,137.0,113.0,143.0,113.0,162.0,194.0,194.0,161.0,298.0,161.0,238.0,238.0,238.0,238.0,162.0,157.0,157.0,284.0,284.0,284.0,157.0,157.0,157.0,284.0,284.0,119.0,169.0,354.0,253.0,287.0,287.0,256.0,256.0,253.0,253.0,253.0,327.0,208.0,208.0,208.0,208.0,208.0,208.0,268.0,299.0,268.0,268.0,251.0,299.0,300.0,268.0,299.0,268.0,208.0,299.0,197.0,197.0,197.0,197.0,197.0,197
.0,197.0,197.0,197.0,197.0,197.0,290.0,290.0,290.0,290.0,108.0,108.0,290.0,209.0,152.0,308.0,101.0,229.0,215.0,266.0,215.0,209.0,153.0,318.0,167.0,196.0,215.0,155.0,177.0,244.0,239.0,239.0,303.0,303.0,230.0,319.0,239.0,239.0,295.0,297.0,260.0,160.0,303.0,319.0,230.0,230.0,295.0,230.0,239.0,295.0,239.0,239.0,295.0,322.0,322.0,239.0,239.0,239.0,239.0,239.0,239.0,239.0,462.0,462.0,402.0,442.0,442.0,412.0,427.0,475.0,442.0,462.0,412.0,442.0,442.0,442.0,462.0,402.0,402.0,463.0,462.0,462.0,462.0,455.0,475.0,468.0,412.0,442.0,450.0,442.0,442.0,442.0,475.0,412.0,421.0,462.0,442.0,442.0,442.0,442.0,442.0,417.0,462.0,462.0,412.0,442.0,462.0,462.0,442.0,407.0,462.0,442.0,442.0,462.0,412.0,462.0,442.0,462.0,442.0,442.0,442.0,412.0,412.0,442.0,412.0,442.0,412.0,442.0,412.0,442.0,475.0,442.0,442.0,442.0,442.0,442.0,442.0,475.0,419.0,442.0,431.0,468.0,475.0,475.0,442.0,412.0,412.0,475.0,433.0,442.0,442.0,442.0,442.0,442.0,442.0,442.0,442.0,462.0,442.0,412.0,462.0,462.0,412.0,462.0,458.0,462.0,462.0,462.0,462.0,462.0,442.0,462.0,462.0,442.0,442.0,442.0,442.0,442.0,412.0,412.0,462.0,412.0,442.0,475.0,475.0,412.0,412.0,412.0,442.0,462.0,475.0,442.0,442.0,462.0,442.0,470.0,470.0,412.0,462.0,442.0,462.0,412.0,412.0,412.0,412.0,442.0,412.0,462.0,442.0,412.0,402.0,462.0,468.0,468.0,468.0,468.0,402.0,442.0,462.0,416.0,416.0,458.0,427.0,458.0,458.0,427.0,427.0,458.0,458.0,417.0,417.0,417.0,417.0,417.0,417.0,417.0,427.0,469.0,458.0,417.0,442.0,417.0,417.0,464.0,464.0,455.0,416.0,417.0,420.0,420.0,420.0,420.0,420.0,412.0,464.0,472.0,473.0,473.0,442.0,442.0,475.0,462.0,475.0,442.0,443.0,443.0,443.0,446.0,406.0,412.0,447.0,442.0,402.0,407.0,458.0,475.0,442.0,464.0,446.0,475.0,464.0,464.0,462.0,463.0,412.0,471.0,417.0,442.0,458.0,469.0,458.0,458.0,413.0,464.0,464.0,420.0,406.0,465.0,466.0,450.0,455.0,458.0,458.0,458.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,463.0,464.0,462.0,475.0,415.0,463.0,464.0,462.0,249.0,218.0,183.0,102.0,180.0,183.0,288.0,183.0,248.0
,181.0,159.0,158.0,158.0,218.0,158.0,351.0,289.0,289.0,158.0,351.0,351.0,245.0,288.0,173.0,102.0,124.0,248.0,248.0,218.0,124.0,264.0,245.0,248.0,304.0,304.0,317.0,317.0,304.0,317.0,317.0,317.0,317.0,304.0,247.0,317.0,317.0,317.0,317.0,317.0,304.0,317.0,317.0,154.0,317.0,207.0,311.0,126.0,202.0,202.0,204.0,311.0,311.0,126.0,309.0,311.0,311.0,311.0,313.0,313.0,313.0,309.0,204.0,313.0,107.0,314.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0,328.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":205,"null_rate":0.0,"stats":{"iqr":217.25,"kurtosis":-1.241582324287736,"max":475.0,"mean":339.0130544637844,"median":412.0,"min":101.0,"n_outliers":0,"outlier_rate":0.0,"q1":232.75,"q3":450.0,"skew":-0.5034591288285603,"std":123.20329449313641,"zero_rate":0.0}},{"alerts":[],"column":"ROP2","extras":{"singletons":11,"top_values":[["A012",3678],["C0229",169],["C0147",167],["C0252",151],["C0102",128],["C0061",111],["C0179",90],["C0207",86],["C0013",76],["C0156",75],["C0223",75],["C0015",70],["C0221",68],["C0126",63],["C0114",61],["C0017",59],["C0019",58],["C0216",52],["C0062",51],["C0201",50]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":155,"null_rate":0.0,"stats":{"cardinality":155,"entropy":4.085050127180254,"entropy_ratio":0.5614321443183582,"top_rate":0.5162829870859068,"top_value":"A012"}},{"alerts":[],"column":"PeopleCluster","extras":{"singletons":11,"top_values":[["South Asia Hindu - other",869],["South Asia Muslim - other",586],["South Asia Dalit - other",352],["South Asia Tribal - other",311],["South Asia Muslim - Pashtun",293],["Tibeto-Burman, other",169],["Mon-Khmer",167],["Deaf",151],["South Asia Muslim - Jat",138],["Jewish",128],["South Asia Forward Caste - Brahmin",123],["South Asia - other",114],["South Asia Muslim - Rajput",112],["Caucasus",111],["South Asia Forward Caste - Rajput",95],["Persian",90],["South Asia Buddhist",87],["Tai",86],["South Asia Hindu - Jat",77],["Arab, 
Arabian",76]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":205,"null_rate":0.0,"stats":{"cardinality":205,"entropy":6.107948337574699,"entropy_ratio":0.7953596152906298,"top_rate":0.12198203256597417,"top_value":"South Asia Hindu - other"}},{"alerts":[{"code":"one_word","level":"warn","message":"47.5% rows are a single word"},{"code":"duplicates","level":"warn","message":"35.4% duplicate strings"}],"column":"PeopNameAcrossCountries","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1,14,95,582,679,736,689,382,206,209,270,277,308,420,310,253,164,103,67,0,79,55,64,105,205,209,194,115,67,57,36,50,45,33,18,22,1,1,1,2],"edges":[1.0,1.95,2.9,3.8499999999999996,4.8,5.75,6.699999999999999,7.6499999999999995,8.6,9.549999999999999,10.5,11.45,12.399999999999999,13.35,14.299999999999999,15.25,16.2,17.15,18.099999999999998,19.05,20.0,20.95,21.9,22.849999999999998,23.799999999999997,24.75,25.7,26.65,27.599999999999998,28.549999999999997,29.5,30.45,31.4,32.349999999999994,33.3,34.25,35.199999999999996,36.15,37.1,38.05,39.0]},"near_unique":false,"sample":["Arab","Mansoori","Pa'a","Biafada","Ghosi (Hindu traditions)","Turk","Kandu","Tulai","Fulani, Nigerian","Arab, Moroccan","Walang","Nai (Hindu traditions)","Mulao Jia","Arab, Arabic Gulf Spoken","Zhuang, Guibian","Kulina Pano","Adyghe","Gulud","Deaf","Chunvalia","Dakpa","Bedouin, Nail","Jewish, English-speaking","Chechen","Darzi Mathuria (Muslim traditions)","Baloch Qaisrani","Ramdasia (Hindu traditions)","Sama, Mapun","Han Chinese, Hakka","Turk","Jat Autrah","Rajput Garewal (Muslim traditions)","Rajput Chauhan (Muslim traditions)","Bolodia","Badwa","Ho","Phuma","Khumra (Muslim traditions)","Kamboh (Hindu traditions)","Vaddar (Muslim traditions)","Temein, Arabized","Nasu, Southern","Miao, Baishi","Naheng","Uzbek, Northern","Turk, Meskhetian","Punjabi, Western","Bote-Majhi","Jewish Tat, Mountain 
Jewish","Zarma"],"top_values":[["Deaf",151],["Turk",38],["Persian",36],["Japanese",34],["South Asian, general",34],["Kurd, Kurmanji",28],["Somali",27],["Thai",27],["Arab, Moroccan",25],["Urdu",24],["Arab, Sudanese",23],["Nepali, general",23],["Malay",22],["Afghani, general",21],["Bosniak",20],["Gujarati",20],["Punjabi",19],["Algerian, Arabic-speaking",18],["Arab, Iraqi",18],["Swahili",18]],"top_words":[["traditions)",985],["(hindu",492],["(muslim",424],["pashtun",237],["jat",232],["arab,",216],["rajput",208],["deaf",151],["brahmin",126],["jewish,",115],["general",100],["bania",74],["(sikh",63],["berber,",61],["south",61],["asian,",57],["baloch",54],["northern",52],["tai",52],["khel",52],["western",47],["southern",46],["turk",46],["kurd,",37],["persian",36]],"vocab_skipped":null,"word_histogram":{"counts":[3384,0,0,0,0,0,0,2345,0,0,0,0,0,0,0,1082,0,0,0,0,0,0,302,0,0,0,0,0,0,11],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":4604,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.35373385738349244,"emoji_rate":0.0,"len_max":39,"len_mean":12.377596855699046,"len_median":10.0,"len_min":1,"len_p95":27.0,"n_duplicates":2520,"n_empty":0,"one_word_rate":0.4750140370578327,"readability_flesch_mean":56.011600000000016,"url_rate":0.0,"vocab_size":4431,"word_mean":1.7662829870859067,"word_median":2.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+21.10"},{"code":"outliers","level":"warn","message":"14.9% rows beyond 1.5 
IQR"}],"column":"Population","extras":{"histogram":{"counts":[6930,78,36,17,11,8,7,3,2,1,2,4,0,3,1,0,1,0,1,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,1],"edges":[10.0,3388334.75,6776659.5,10164984.25,13553309.0,16941633.75,20329958.5,23718283.25,27106608.0,30494932.75,33883257.5,37271582.25,40659907.0,44048231.75,47436556.5,50824881.25,54213206.0,57601530.75,60989855.5,64378180.25,67766505.0,71154829.75,74543154.5,77931479.25,81319804.0,84708128.75,88096453.5,91484778.25,94873103.0,98261427.75,101649752.5,105038077.25,108426402.0,111814726.75,115203051.5,118591376.25,121979701.0,125368025.75,128756350.5,132144675.25,135533000.0]},"sample":[211000.0,320000.0,98000.0,20000.0,16000.0,14000.0,104000.0,21000.0,311000.0,21070000.0,18000.0,20000.0,26000.0,12000.0,1100.0,9000.0,45000.0,203000.0,16000.0,249000.0,20000.0,7000.0,178000.0,1200.0,10988000.0,512000.0,70000.0,90000.0,7200.0,6200.0,49000.0,297000.0,35408000.0,5700.0,51000.0,49000.0,9200.0,13000.0,46000.0,2000.0,23000.0,24000.0,118000.0,272000.0,5700.0,23000.0,400.0,34000.0,4700.0,1300.0,10000.0,20000.0,15000.0,45000.0,681000.0,141000.0,66000.0,101000.0,67000.0,28000.0,163000.0,8400.0,54000.0,53000.0,7700.0,11000.0,2600.0,2600.0,13000.0,7000.0,12313000.0,349000.0,9800.0,24000.0,16000.0,1300.0,26000.0,2900.0,2600.0,29000.0,119000.0,4300.0,5300.0,139000.0,7100.0,2600.0,15000.0,1500.0,1600.0,2400.0,300.0,400.0,30.0,1500.0,500.0,80.0,4143000.0,1300.0,14000.0,82000.0,5000.0,25000.0,100.0,3396000.0,700.0,167000.0,900.0,202000.0,600.0,2100.0,269000.0,377000.0,200.0,15000.0,800.0,5800.0,9000.0,102000.0,2300.0,21000.0,300.0,25000.0,1900.0,700.0,49000.0,9200.0,14000.0,3100.0,57000.0,140000.0,120000.0,15000.0,2300.0,200.0,300.0,1500.0,2160000.0,191000.0,181000.0,700.0,80000.0,1400.0,700.0,700.0,1100.0,161000.0,77000.0,58000.0,21000.0,35000.0,587000.0,19000.0,15000.0,19000.0,22000.0,1340000.0,129000.0,316000.0,12000.0,3700.0,109000.0,61000.0,167000.0,72000.0,214000.0,25000.0,5500.0,16000.0,6500.0,7400.0,310000.0,211000.0,7900.0,16
000.0,96000.0,5100.0,53000.0,57000.0,34000.0,54000.0,654000.0,31000.0,147000.0,15000.0,4049000.0,19000.0,18000.0,3000.0,91000.0,6400.0,22000.0,1200.0,6400.0,23000.0,9700.0,10000.0,51000.0,43000.0,90000.0,52000.0,1300.0,6500.0,5100.0,59000.0,14000.0,12000.0,44000.0,4500.0,71000.0,53000.0,5400.0,4600.0,7000.0,1086000.0,1500.0,226000.0,2200.0,8100.0,83000.0,4200.0,4000.0,261000.0,12000.0,1700.0,42000.0,10000.0,1664000.0,13000.0,20000.0,23000.0,5700.0,17000.0,317000.0,296000.0,16133000.0,6000.0,196000.0,87000.0,8100.0,58000.0,139000.0,1300.0,19000.0,188000.0,20000.0,6000.0,42000.0,63000.0,5200.0,78000.0,118000.0,11000.0,11000.0,2700.0,836000.0,1019000.0,10000.0,12000.0,2100.0,19000.0,4800.0,55000.0,152000.0,55000.0,3200.0,40000.0,3200.0,58000.0,86000.0,63000.0,123000.0,36000.0,1373000.0,6900.0,229000.0,3342000.0,51000.0,482000.0,2000.0,1500.0,8061000.0,1100.0,93000.0,47000.0,1300.0,144000.0,6100.0,128000.0,15000.0,433000.0,144000.0,352000.0,967000.0,1600.0,78000.0,1200.0,3500.0,1300.0,3700.0,5900.0,65000.0,800.0,4900.0,34000.0,13000.0,969000.0,14000.0,76000.0,250000.0,188000.0,589000.0,1300.0,61000.0,194000.0,120000.0,84000.0,59000.0,117000.0,58000.0,78000.0,52000.0,188000.0,351000.0,43000.0,179000.0,467000.0,3346000.0,108000.0,77000.0,155000.0,3800.0,108000.0,144000.0,40000.0,44000.0,97000.0,579000.0,293000.0,566000.0,35000.0,2000.0,49000.0,104000.0,18000.0,5400.0,5100.0,125000.0,82000.0,2201000.0,1100.0,3400.0,6100.0,44000.0,78000.0,2100.0,9400.0,200000.0,14000.0,9500.0,38000.0,128000.0,25000.0,40000.0,4500.0,36000.0,3100.0,216000.0,36000.0,15000.0,61000.0,3900.0,24000.0,1792000.0,1197000.0,113000.0,8100.0,130000.0,8400.0,26000.0,24000.0,10000.0,18000.0,27000.0,23000.0,487000.0,83000.0,67000.0,50000.0,31000.0,32000.0,13000.0,28000.0,34000.0,195000.0,25000.0,80000.0,23000.0,19000.0,161000.0,55000.0,336000.0,27000.0,31000.0,3688000.0,8400.0,1200.0,4940000.0,2500.0,4100.0,1400.0,112000.0,28000.0,1735000.0,113000.0,8400.0,1200.0,147000.0,329000.0,2200.0,30000.0,67000.0,28
00.0,38000.0,1080000.0,106000.0,83000.0,760000.0,1307000.0,271000.0,417000.0,6400.0,55000.0,16000.0,29000.0,11000.0,5500.0,88000.0,467000.0,122000.0,32000.0,139000.0,3700.0,11000.0,13000.0,5000.0,6900.0,3300.0,16000.0,11000.0,5400.0,1587000.0,51000.0,455000.0,1600.0,136000.0,1700.0,32000.0,38000.0,5900.0,49000.0,39000.0,18000.0,3900.0,2200.0,2900.0,1500.0,8050000.0,3600.0,1563000.0,37000.0,12000.0,500.0,500.0,2087000.0,8400.0,1143000.0,165000.0,221000.0,294000.0,73000.0,35000.0,35000.0,30.0,1300.0,60000.0,11000.0,13000.0,200.0,20000.0,126000.0,36000.0,20000.0,1000.0,59000.0,16000.0,9500.0,200.0,6000.0,200000.0,8300.0]},"kind":"numeric","n":7124,"n_null":15,"n_unique":1200,"null_rate":0.0021055586749017404,"stats":{"iqr":122300.0,"kurtosis":607.3797730299965,"max":135533000.0,"mean":502569.76086650725,"median":30000.0,"min":10.0,"n_outliers":1058,"outlier_rate":0.14882543255028838,"q1":6700.0,"q3":129000.0,"skew":21.104426485398207,"std":3568058.7981768283,"zero_rate":0.0}},{"alerts":[],"column":"Category","extras":{"singletons":0,"top_values":[["3",4299],["1",2330],["2",495]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":3,"null_rate":0.0,"stats":{"cardinality":3,"entropy":1.2343870839379618,"entropy_ratio":0.7788115386807682,"top_rate":0.6034531162268388,"top_value":"3"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"78.0% duplicate 
strings"}],"column":"ROL3","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[2.5,2.525,2.55,2.575,2.6,2.625,2.65,2.675,2.7,2.725,2.75,2.775,2.8,2.825,2.85,2.875,2.9,2.925,2.95,2.975,3.0,3.025,3.05,3.075,3.1,3.125,3.15,3.175,3.2,3.225,3.25,3.275,3.3,3.325,3.35,3.375,3.4,3.425,3.45,3.475,3.5]},"near_unique":false,"sample":["acm","guj","pqa","bif","hin","tur","bho","hau","fuv","ary","bap","hin","cmn","afb","zgn","xpk","ady","apd","rsl","guj","dka","arq","eng","che","hin","bgp","pan","sjm","hak","tur","skr","pan","snd","ory","hin","syl","ypm","skr","hin","urd","apd","yiv","cmn","nxq","uzn","kat","pnb","bmj","jdt","dje"],"top_values":[["hin",662],["ben",357],["snd",191],["urd",167],["guj",155],["ory",150],["pbu",146],["skr",140],["tel",136],["pan",131],["pnb",130],["tam",129],["apd",110],["xxx",104],["mar",96],["kan",90],["mal",85],["npi",71],["pst",71],["mai",69]],"top_words":[["hin",662],["ben",357],["snd",191],["urd",167],["guj",155],["ory",150],["pbu",146],["skr",140],["tel",136],["pan",131],["pnb",130],["tam",129],["apd",110],["xxx",104],["mar",96],["kan",90],["mal",85],["npi",71],["pst",71],["mai",69],["tur",55],["apc",52],["cmn",50],["kmr",44],["bcc",37]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":1565,"null_rate":0.0,"stats":{"allcaps_rate":0.00028074115665356543,"boilerplate_rate":0.0,"duplic
ate_rate":0.7803200449185851,"emoji_rate":0.0,"len_max":3,"len_mean":3.0,"len_median":3.0,"len_min":3,"len_p95":3.0,"n_duplicates":5559,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":118.68200000000003,"url_rate":0.0,"vocab_size":1564,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"70.2% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"78.1% duplicate strings"}],"column":"PrimaryLanguageName","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[2,29,61,655,0,1267,888,1222,0,517,207,137,65,0,98,157,150,0,204,890,228,60,0,37,46,51,0,35,34,41,3,0,16,8,3,0,1,0,11,1],"edges":[1.0,1.775,2.55,3.325,4.1,4.875,5.65,6.425,7.2,7.9750000000000005,8.75,9.525,10.3,11.075000000000001,11.85,12.625,13.4,14.175,14.950000000000001,15.725,16.5,17.275000000000002,18.05,18.825,19.6,20.375,21.150000000000002,21.925,22.7,23.475,24.25,25.025000000000002,25.8,26.575,27.35,28.125,28.900000000000002,29.675,30.45,31.225,32.0]},"near_unique":false,"sample":["Arabic, Mesopotamian","Gujarati","Pa'a","Biafada","Hindi","Turkish","Bhojpuri","Hausa","Fulfulde, Nigerian","Arabic, Moroccan","Bantawa","Hindi","Chinese, Mandarin","Arabic, Gulf","Zhuang, Guibian","Kulina Pano","Adyghe","Arabic, Sudanese","Russian Sign Language","Gujarati","Dakpakha","Arabic, Algerian","English","Chechen","Hindi","Balochi, Eastern","Punjabi, Eastern","Mapun","Chinese, Hakka","Turkish","Saraiki","Punjabi, Eastern","Sindhi","Odia","Hindi","Sylheti","Phuma","Saraiki","Hindi","Urdu","Arabic, Sudanese","Nisu, Northern","Chinese, Mandarin","Naxi","Uzbek, Northern","Georgian","Punjabi, Western","Bote","Judeo-Tat","Zarma"],"top_values":[["Hindi",662],["Bengali",357],["Sindhi",191],["Urdu",167],["Gujarati",155],["Odia",150],["Pashto, Northern",146],["Saraiki",140],["Telugu",136],["Punjabi, Eastern",131],["Punjabi, 
Western",130],["Tamil",129],["Arabic, Sudanese",110],["Language unknown",104],["Marathi",96],["Kannada",90],["Malayalam",85],["Nepali",71],["Pashto, Central",71],["Maithili",69]],"top_words":[["hindi",662],["arabic,",422],["bengali",357],["punjabi,",261],["northern",258],["pashto,",237],["eastern",208],["language",195],["sindhi",191],["western",168],["urdu",167],["gujarati",155],["odia",150],["saraiki",140],["telugu",136],["tamil",129],["central",125],["sudanese",110],["unknown",104],["southern",100],["marathi",96],["sign",91],["kannada",90],["malayalam",85],["balochi,",72]],"vocab_skipped":null,"word_histogram":{"counts":[4998,0,0,0,0,0,0,1916,0,0,0,0,0,0,0,188,0,0,0,0,0,0,20,0,0,0,0,0,0,2],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":1563,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.7806007860752386,"emoji_rate":0.0,"len_max":32,"len_mean":9.14654688377316,"len_median":7.0,"len_min":1,"len_p95":17.0,"n_duplicates":5561,"n_empty":0,"one_word_rate":0.70157215047726,"readability_flesch_mean":33.28345000000002,"url_rate":0.0,"vocab_size":1641,"word_mean":1.3312745648512072,"word_median":1.0}},{"alerts":[{"code":"long_tail","level":"info","message":"255 singleton categories"},{"code":"null_rate","level":"warn","message":"94.5% null"}],"column":"PrimaryLanguageDialect","extras":{"singletons":255,"top_values":[["Punjabi",12],["Ta'izzi",8],["Sinhalese",6],["Wasulunkakan",6],["Pomak",5],["Siripuria",5],["Hui",4],["Vixlin",4],["Western Sudanese",3],["Brazilian 
Portuguese",3],["Bawean",3],["Bajuni",3],["Miri",3],["Southern Khams",3],["Levantine Turkmen",3],["Jerbi",2],["Tawallammat Tan Ataram",2],["Tihami",2],["Timbuktu",2],["Xinan Guanhua",2]]},"kind":"categorical","n":7124,"n_null":6732,"n_unique":303,"null_rate":0.9449747332959012,"stats":{"cardinality":303,"entropy":8.011284860744478,"entropy_ratio":0.9718689520331129,"top_rate":0.030612244897959183,"top_value":"Punjabi"}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+4.87"},{"code":"outliers","level":"warn","message":"8.4% rows beyond 1.5 IQR"}],"column":"NumberLanguagesSpoken","extras":{"histogram":{"counts":[4930,911,493,262,146,88,54,51,44,27,21,14,17,14,9,9,8,4,4,6,2,2,0,1,1,2,0,2,0,0,0,0,0,0,1,0,0,0,0,1],"edges":[1.0,3.975,6.95,9.925,12.9,15.875,18.85,21.825,24.8,27.775000000000002,30.75,33.725,36.7,39.675000000000004,42.65,45.625,48.6,51.575,54.550000000000004,57.525,60.5,63.475,66.45,69.425,72.4,75.375,78.35000000000001,81.325,84.3,87.275,90.25,93.22500000000001,96.2,99.175,102.15,105.125,108.10000000000001,111.075,114.05,117.025,120.0]},"sample":[2.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,4.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,1.0,4.0,1.0,1.0,24.0,12.0,2.0,1.0,18.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,5.0,1.0,4.0,1.0,6.0,6.0,4.0,3.0,2.0,4.0,2.0,8.0,10.0,2.0,29.0,45.0,11.0,5.0,11.0,10.0,8.0,7.0,8.0,2.0,2.0,3.0,15.0,12.0,2.0,6.0,1.0,8.0,3.0,6.0,4.0,4.0,6.0,4.0,1.0,8.0,6.0,18.0,6.0,1.0,4.0,3.0,18.0,4.0,14.0,9.0,13.0,25.0,4.0,7.0,22.0,20.0,9.0,2.0,41.0,2.0
,43.0,31.0,17.0,3.0,39.0,14.0,8.0,10.0,78.0,3.0,22.0,4.0,5.0,28.0,5.0,6.0,3.0,17.0,4.0,5.0,12.0,2.0,28.0,3.0,8.0,16.0,15.0,15.0,46.0,7.0,14.0,2.0,2.0,4.0,3.0,1.0,5.0,3.0,1.0,2.0,5.0,3.0,18.0,3.0,2.0,8.0,1.0,9.0,1.0,5.0,3.0,2.0,1.0,7.0,7.0,13.0,3.0,1.0,3.0,5.0,5.0,3.0,21.0,1.0,1.0,5.0,2.0,17.0,2.0,2.0,4.0,4.0,1.0,1.0,1.0,2.0,6.0,45.0,3.0,9.0,6.0,4.0,11.0,3.0,6.0,9.0,10.0,3.0,11.0,28.0,4.0,5.0,15.0,7.0,2.0,3.0,5.0,17.0,3.0,7.0,2.0,2.0,11.0,5.0,6.0,4.0,4.0,3.0,29.0,18.0,3.0,2.0,11.0,9.0,10.0,9.0,2.0,8.0,4.0,5.0,13.0,2.0,9.0,7.0,4.0,1.0,11.0,2.0,1.0,4.0,1.0,11.0,3.0,8.0,2.0,7.0,5.0,2.0,10.0,12.0,5.0,4.0,7.0,5.0,3.0,3.0,5.0,2.0,8.0,6.0,15.0,8.0,6.0,1.0,8.0,6.0,19.0,14.0,4.0,6.0,4.0,6.0,2.0,7.0,10.0,3.0,5.0,7.0,3.0,2.0,6.0,11.0,7.0,3.0,7.0,3.0,2.0,1.0,7.0,23.0,4.0,6.0,8.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,5.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,1.0,4.0,1.0,1.0,1.0,2.0,2.0,4.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,1.0,1.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":69,"null_rate":0.0,"stats":{"iqr":4.0,"kurtosis":36.31399290367042,"max":120.0,"mean":4.333380123526109,"median":1.0,"min":1.0,"n_outliers":597,"outlier_rate":0.08380123526108928,"q1":1.0,"q3":5.0,"skew":4.871081303594153,"std":7.320285636937211,"zero_rate":0.0}},{"alerts":[],"column":"OfficialLang","extras":{"singletons":6,"top_values":[["Hindi",2032],["Urdu",767],["Arabic, Standard",657],["Chinese, Mandarin",475],["English",433],["French",303],["Bengali",256],["Indonesian",234],["Nepali",184],["Lao",142],["Russian",115],["Portuguese",94],["Malay",87],["Persian, Iranian",85],["Spanish",79],["Thai",73],["Vietnamese",69],["Turkish",61],["Burmese",59],["Pashto, 
Southern",58]]},"kind":"categorical","n":7124,"n_null":6,"n_unique":79,"null_rate":0.0008422234699606962,"stats":{"cardinality":79,"entropy":4.1781623127737895,"entropy_ratio":0.6628026068295618,"top_rate":0.28547344759763976,"top_value":"Hindi"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"SpeakNationalLang","extras":{},"kind":"unknown","n":7124,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"outliers","level":"warn","message":"13.5% rows beyond 1.5 IQR"}],"column":"BibleStatus","extras":{"histogram":{"counts":[272,0,0,0,0,0,0,0,216,0,0,0,0,0,0,0,473,0,0,0,0,0,0,0,795,0,0,0,0,0,0,0,1506,0,0,0,0,0,0,3862],"edges":[0.0,0.125,0.25,0.375,0.5,0.625,0.75,0.875,1.0,1.125,1.25,1.375,1.5,1.625,1.75,1.875,2.0,2.125,2.25,2.375,2.5,2.625,2.75,2.875,3.0,3.125,3.25,3.375,3.5,3.625,3.75,3.875,4.0,4.125,4.25,4.375,4.5,4.625,4.75,4.875,5.0]},"sample":[2.0,4.0,4.0,2.0,4.0,3.0,4.0,4.0,4.0,4.0,4.0,4.0,3.0,0.0,4.0,4.0,3.0,4.0,2.0,4.0,4.0,3.0,3.0,4.0,2.0,4.0,3.0,5.0,5.0,3.0,5.0,5.0,3.0,4.0,2.0,4.0,0.0,4.0,4.0,5.0,5.0,5.0,5.0,3.0,4.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,4.0,4.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,3.0,5.0,5.0,2.0,5.0,4.0,5.0,3.0,2.0,5.0,2.0,5.0,5.0,5.0,5.0,0.0,5.0,0.0,0.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,3.0,2.0,2.0,3.0,3.0,0.0,4.0,5.0,4.0,2.0,5.0,4.0,5.0,2.0,0.0,5.0,1.0,2.0,2.0,5.0,5.0,1.0,3.0,4.0,0.0,2.0,2.0,0.0,4.0,4.0,1.0,1.0,5.0,4.0,1.0,3.0,2.0,3.0,2.0,1.0,0.0,3.0,3.0,5.0,3.0,5.0,4.0,3.0,3.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,2.0,3.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,3.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,3.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,5.0,5.0,5.0,5.0,5.0,3.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,4.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,4.0,4.0,5.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,
5.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,0.0,5.0,3.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,3.0,5.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,4.0,4.0,5.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,4.0,4.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,4.0,4.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,4.0,5.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,4.0,5.0,4.0,5.0,5.0,2.0,1.0,2.0,4.0,4.0,2.0,5.0,4.0,2.0,1.0,4.0,2.0,5.0,3.0,3.0,5.0,5.0,5.0,2.0,2.0,4.0,1.0,4.0,2.0,2.0,3.0,4.0,1.0,3.0,4.0,5.0,5.0,1.0,4.0,2.0,1.0,3.0,1.0,5.0,0.0,4.0,3.0,4.0,5.0,2.0,1.0,4.0,1.0,3.0,4.0,0.0,2.0,4.0,5.0,5.0,5.0,5.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,0.0,4.0,5.0,0.0,2.0,0.0,0.0,0.0,0.0,3.0,0.0,2.0,3.0,0.0,2.0,4.0,2.0,3.0,3.0,0.0,2.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":1.5378029529129034,"max":5.0,"mean":4.054042672655811,"median":5.0,"min":0.0,"n_outliers":961,"outlier_rate":0.1348961257720382,"q1":4.0,"q3":5.0,"skew":-1.5132565549798649,"std":1.3417869392093136,"zero_rate":0.0381807973048849}},{"alerts":[{"code":"null_rate","level":"warn","message":"45.8% 
null"}],"column":"BibleYear","extras":{"singletons":45,"top_values":[["1818-2022",662],["1809-2022",357],["1954",191],["1843-2022",167],["1823-2021",155],["1815-2021",150],["1895-2020",146],["1854-2022",136],["1959-2021",131],["1727-2024",129],["1821-2024",96],["1827-2024",90],["1841-2022",85],["2008",80],["1914-2024",71],["1827-2009",55],["1874-2018",50],["2023",43],["1883-2018",36],["1838-2023",36]]},"kind":"categorical","n":7124,"n_null":3262,"n_unique":163,"null_rate":0.45788882650196516,"stats":{"cardinality":163,"entropy":5.318460632512652,"entropy_ratio":0.7237253196596358,"top_rate":0.17141377524598653,"top_value":"1818-2022"}},{"alerts":[{"code":"null_rate","level":"warn","message":"24.6% null"}],"column":"NTYear","extras":{"singletons":99,"top_values":[["1811-1998",662],["1801-1984",357],["Yes",345],["1890-1992",191],["1758-2000",167],["1820-1985",155],["1809-2000",150],["1818-1991",146],["2023-2024",146],["1818-1989",136],["1815-2011",131],["1819-2021",130],["1715-1998",129],["1978-2022",110],["1827-2023",100],["1811-1982",96],["1829-1995",85],["2010",83],["1819-1993",77],["1821-2010",71]]},"kind":"categorical","n":7124,"n_null":1756,"n_unique":305,"null_rate":0.24649073554183043,"stats":{"cardinality":305,"entropy":6.065197651022559,"entropy_ratio":0.734938027073488,"top_rate":0.12332339791356185,"top_value":"1811-1998"}},{"alerts":[],"column":"PortionsYear","extras":{"singletons":171,"top_values":[["Yes",821],["1806-1962",662],["1800-1980",357],["1825-1981",191],["1747-1894",167],["1809-1965",155],["1811-1956",150],["1824-2010",146],["1812-1966",136],["1818-1954",131],["1885-1922",130],["1714-1956",129],["1927-1964",110],["1807-1957",96],["1812-1988",90],["1811-1968",85],["2024",73],["1850-1961",71],["1782-1985",55],["1939-2021",52]]},"kind":"categorical","n":7124,"n_null":961,"n_unique":460,"null_rate":0.1348961257720382,"stats":{"cardinality":460,"entropy":6.289018265346477,"entropy_ratio":0.7109858503175909,"top_rate":0.1332143436638001,"top_value":"
Yes"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"TranslationNeedQuestionable","extras":{},"kind":"unknown","n":7124,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"constant","level":"info","message":"only one distinct value"}],"column":"JPScale","extras":{"histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.525,0.55,0.575,0.6,0.625,0.65,0.675,0.7,0.725,0.75,0.775,0.8,0.825,0.8500000000000001,0.875,0.9,0.925,0.95,0.9750000000000001,1.0,1.025,1.05,1.0750000000000002,1.1,1.125,1.15,1.175,1.2000000000000002,1.225,1.25,1.275,1.3,1.3250000000000002,1.35,1.375,1.4,1.425,1.4500000000000002,1.475,1.5]},"sample":[1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.
0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":0.0,"max":1.0,"mean":1.0,"median":1.0,"min":1.0,"n_outliers":0,"outlier_rate":0.0,"q1":1.0,"q3":1.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[],"column":"JPScalePC","extras":{"singletons":0,"top_values":[["1",5001],["4",1141],["2",525],["5",252],["3",205]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":5,"null_rate":0.0,"stats":{"cardinality":5,"entropy":1.3766663059887423,"entropy_ratio":0.5928979062788441,"top_rate":0.7019932622122403,"top_value":"1"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.0% of rows"}],"column":"JPScalePGAC","extras":{"singletons":0,"top_values":[["1",6910],["4",118],["2",75],["5",15],["3",6]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":5,"null_rate":0.0,"stats":{"cardinality":5,"entropy":0.23715595566297726,"entropy_ratio":0.10213751071153726,"top_rate":0.9699606962380685,"top_value":"1"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"LeastReached","extras":{"singletons":0,"top_values":[["Y",7124]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Y"}},{"alerts":[],"column":"LeastReachedPC","extras":{"singletons":0,"top_values":[["Y",5152],["N",1972]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.8510687969770052,"entropy_ratio":0.8510687969770052,"top_rate":0.7231892195395845,"top_value":"Y"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.0% of rows"}],"column":"LeastReachedPGAC","extras":{"singletons":0,"top_values":[["Y",6910],["N",214]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.19458892596905494,"entropy_ratio":0.19458892596905494,"top_rate":0.9699606962380685,"top_value":"Y"}},{"alerts":[],"column":"GSEC","extras":{"singletons":0,"top_values":[["",3639],["1",2767],["4",186],["0",176],["2",139],["3",100],["6",62],["5",55]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"cardinality":8,"entropy":1.6051409062515756,"entropy_ratio":0.5350469687505252,"top_rate":0.5108085345311623,"top_value":""}},{"alerts":[],"column":"HasAudioRecordings","extras":{"singletons":0,"top_values":[["Y",6188],["N",936]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.5612294270509872,"entropy_ratio":0.5612294270509872,"top_rate":0.8686131386861314,"top_value":"Y"}},{"alerts":[{"code":"null_rate","level":"warn","message":"22.4% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"NTOnline","extras":{"singletons":0,"top_values":[["Y",5528]]},"kind":"categorical","n":7124,"n_null":1596,"n_unique":1,"null_rate":0.2240314430095452,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Y"}},{"alerts":[{"code":"outliers","level":"warn","message":"10.6% rows beyond 1.5 IQR"}],"column":"RLG3","extras":{"histogram":{"counts":[480,0,0,0,0,0,0,0,0,0,0,933,0,0,0,0,0,2142,0,0,0,0,3279,0,0,0,0,0,13,0,0,0,0,0,120,0,0,0,0,157],"edges":[2.0,2.175,2.35,2.525,2.7,2.875,3.05,3.2249999999999996,3.4,3.575,3.75,3.925,4.1,4.275,4.449999999999999,4.625,4.8,4.975,5.15,5.324999999999999,5.5,5.675,5.85,6.0249999999999995,6.199999999999999,6.375,6.55,6.725,6.8999999999999995,7.074999999999999,7.25,7.425,7.6,7.7749999999999995,7.949999999999999,8.125,8.3,8.475,8.649999999999999,8.825,9.0]},"sample":[6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,8.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,2.0,2.0,4.0,4.0,4.0,4.0,2.0,4.0,2.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,7.0,6.0,4.0,6.0,6.0,6.0,4.0,6.0,4.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,8.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,4.0,6.0,6.0,6.0,4.0,4.0,2.0,2.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,6.0,2.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,4.0,2.0,6.0,6.0,2.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,5.0,5.0,6.0,2.0,2.0,6.0,6.0,6.0,6.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,5.0,5.0,6.0,5.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,8.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,6.0,6.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,5.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,5.0,8.0,8.0,5.0,6.0,5.0,6.0,5.0,5.0,5.0
,5.0,5.0,5.0,6.0,5.0,5.0,2.0,6.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,6.0,5.0,6.0,6.0,5.0,5.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,8.0,6.0,5.0,5.0,5.0,5.0,6.0,6.0,6.0,8.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,6.0,5.0,5.0,6.0,6.0,6.0,6.0,5.0,5.0,5.0,5.0,6.0,8.0,6.0,6.0,5.0,6.0,6.0,5.0,8.0,6.0,6.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,8.0,6.0,6.0,6.0,6.0,5.0,8.0,6.0,6.0,6.0,6.0,6.0,4.0,4.0,6.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,6.0,6.0,6.0,2.0,2.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,2.0,4.0,4.0,2.0,4.0,4.0,2.0,4.0,2.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,2.0,6.0,6.0,6.0,6.0,6.0,2.0,4.0,6.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":2.000736662406161,"max":9.0,"mean":5.269511510387423,"median":6.0,"min":2.0,"n_outliers":757,"outlier_rate":0.10626052779337451,"q1":5.0,"q3":6.0,"skew":-0.4551183828899757,"std":1.279353531429903,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"14.3% rows beyond 1.5 
IQR"}],"column":"RLG3PC","extras":{"histogram":{"counts":[332,0,0,0,0,474,0,0,0,0,0,0,0,0,0,666,0,0,0,0,2296,0,0,0,0,3105,0,0,0,0,35,0,0,0,0,62,0,0,0,154],"edges":[1.0,1.2,1.4,1.6,1.8,2.0,2.2,2.4000000000000004,2.6,2.8,3.0,3.2,3.4000000000000004,3.6,3.8000000000000003,4.0,4.2,4.4,4.6,4.800000000000001,5.0,5.2,5.4,5.6000000000000005,5.800000000000001,6.0,6.2,6.4,6.6000000000000005,6.800000000000001,7.0,7.2,7.4,7.6000000000000005,7.800000000000001,8.0,8.2,8.4,8.600000000000001,8.8,9.0]},"sample":[6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,1.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,2.0,2.0,7.0,1.0,7.0,2.0,2.0,2.0,2.0,6.0,6.0,6.0,1.0,1.0,1.0,6.0,6.0,6.0,1.0,1.0,1.0,1.0,1.0,1.0,6.0,6.0,6.0,6.0,1.0,1.0,1.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,1.0,1.0,1.0,1.0,4.0,4.0,1.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,6.0,4.0,6.0,1.0,2.0,2.0,2.0,2.0,4.0,4.0,2.0,2.0,4.0,4.0,1.0,4.0,2.0,4.0,4.0,4.0,4.0,4.0,2.0,4.0,2.0,2.0,4.0,4.0,4.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,6.0,6.0,2.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,6.0,2.0,2.0,6.0,6.0,6.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,5.0,5.0,6.0,5.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,6.0,6.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,5.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,6.0,5.0,8.0,8.0,5.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,2.0,6.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,6.0,5.0,6.0,6.0,5.0,5.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,8.0,6.0,5.0,5.0,5.0,5.0,6.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,6.0,5.0,5.0,6.0,6.0,6.0,6.0,5.0,5.0,5.0,5.0,6.0,8.0,6.0,6.0,5.0,
6.0,6.0,5.0,5.0,6.0,6.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,5.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,1.0,6.0,6.0,6.0,6.0,6.0,1.0,6.0,1.0,1.0,6.0,1.0,6.0,6.0,6.0,1.0,6.0,6.0,1.0,6.0,6.0,1.0,6.0,6.0,6.0,6.0,6.0,6.0,1.0,6.0,2.0,2.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,2.0,4.0,1.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":1.7031346777823853,"max":9.0,"mean":5.078747894441325,"median":5.0,"min":1.0,"n_outliers":1022,"outlier_rate":0.14345873104997192,"q1":5.0,"q3":6.0,"skew":-0.9462904179989621,"std":1.5204545024551042,"zero_rate":0.0}},{"alerts":[{"code":"outliers","level":"warn","message":"10.9% rows beyond 1.5 IQR"}],"column":"RLG3PGAC","extras":{"histogram":{"counts":[17,0,0,0,0,466,0,0,0,0,0,0,0,0,0,925,0,0,0,0,2154,0,0,0,0,3247,0,0,0,0,22,0,0,0,0,131,0,0,0,162],"edges":[1.0,1.2,1.4,1.6,1.8,2.0,2.2,2.4000000000000004,2.6,2.8,3.0,3.2,3.4000000000000004,3.6,3.8000000000000003,4.0,4.2,4.4,4.6,4.800000000000001,5.0,5.2,5.4,5.6000000000000005,5.800000000000001,6.0,6.2,6.4,6.6000000000000005,6.800000000000001,7.0,7.2,7.4,7.6000000000000005,7.800000000000001,8.0,8.2,8.4,8.600000000000001,8.8,9.0]},"sample":[6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,8.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,2.0,2.0,4.0,1.0,4.0,4.0,2.0,4.0,2.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,7.0,6.0,4.0,6.0,6.0,4.0,4.0,6.0,4.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,8.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,4.0,6.0,6.0,6.0,4.0,4.0,2.0,2.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,6.0,2.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,4.0,2.0,6.0,6.0,2.0,5.0,5.0,5.0,5.0,
2.0,5.0,6.0,5.0,5.0,5.0,5.0,6.0,2.0,2.0,6.0,8.0,8.0,6.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,5.0,5.0,6.0,5.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,8.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,6.0,6.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,5.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,6.0,5.0,5.0,6.0,5.0,8.0,8.0,5.0,6.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,2.0,6.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,6.0,5.0,6.0,6.0,5.0,5.0,6.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,8.0,6.0,5.0,5.0,5.0,5.0,6.0,6.0,6.0,8.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,6.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,2.0,5.0,6.0,5.0,5.0,6.0,5.0,5.0,6.0,6.0,6.0,6.0,5.0,5.0,5.0,5.0,6.0,8.0,6.0,6.0,5.0,6.0,6.0,5.0,8.0,6.0,6.0,5.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,8.0,6.0,6.0,6.0,6.0,5.0,8.0,6.0,6.0,6.0,6.0,6.0,4.0,4.0,6.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,6.0,6.0,6.0,6.0,2.0,2.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,2.0,4.0,4.0,2.0,4.0,4.0,2.0,4.0,2.0,4.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,4.0,6.0,2.0,6.0,6.0,6.0,6.0,6.0,2.0,4.0,6.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0,9.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":2.0320188202721416,"max":9.0,"mean":5.272459292532285,"median":5.5,"min":1.0,"n_outliers":776,"outlier_rate":0.10892756878158338,"q1":5.0,"q3":6.0,"skew":-0.46373196210921297,"std":1.296230266472596,"zero_rate":0.0}},{"alerts":[],"column":"PrimaryReligion","extras":{"singletons":0,"top_values":[["Islam",3279],["Hinduism",2142],["Ethnic Religions",933],["Buddhism",480],["Unknown",157],["Other / 
Small",120],["Non-Religious",13]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"cardinality":7,"entropy":1.9199658428956226,"entropy_ratio":0.6839056322413325,"top_rate":0.46027512633352047,"top_value":"Islam"}},{"alerts":[],"column":"PrimaryReligionPC","extras":{"singletons":0,"top_values":[["Islam",3105],["Hinduism",2296],["Ethnic Religions",666],["Buddhism",474],["Christianity",332],["Unknown",154],["Other / Small",62],["Non-Religious",35]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"cardinality":8,"entropy":2.05141787159492,"entropy_ratio":0.6838059571983067,"top_rate":0.4358506457046603,"top_value":"Islam"}},{"alerts":[],"column":"PrimaryReligionPGAC","extras":{"singletons":0,"top_values":[["Islam",3247],["Hinduism",2154],["Ethnic Religions",925],["Buddhism",466],["Unknown",162],["Other / Small",131],["Non-Religious",22],["Christianity",17]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"cardinality":8,"entropy":1.95487684471231,"entropy_ratio":0.6516256149041033,"top_rate":0.45578326782706347,"top_value":"Islam"}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.4% null"},{"code":"outliers","level":"warn","message":"5.5% rows beyond 1.5 
IQR"}],"column":"RLG4","extras":{"histogram":{"counts":[107,9,0,120,1,0,20,160,2,3,11,79,0,0,0,0,0,4,0,2,8,6,10],"edges":[10.0,11.26086956521739,12.521739130434783,13.782608695652174,15.043478260869566,16.304347826086957,17.565217391304348,18.826086956521742,20.086956521739133,21.347826086956523,22.608695652173914,23.869565217391305,25.130434782608695,26.391304347826086,27.65217391304348,28.91304347826087,30.17391304347826,31.434782608695652,32.69565217391305,33.95652173913044,35.21739130434783,36.47826086956522,37.73913043478261,39.0]},"sample":[20.0,20.0,20.0,20.0,20.0,32.0,32.0,32.0,32.0,20.0,20.0,20.0,20.0,37.0,37.0,37.0,37.0,37.0,37.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,18.0,12.0,20.0,20.0,12.0,12.0,12.0,12.0,12.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,18.0,20.0,20.0,20.0,20.0,18.0,18.0,20.0,25.0,25.0,25.0,25.0,25.0,25.0,25.0,25.0,25.0,20.0,18.0,18.0,18.0,18.0,18.0,18.0,20.0,20.0,18.0,18.0,20.0,25.0,18.0,35.0,35.0,39.0,39.0,39.0,39.0,39.0,39.0,39.0,39.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,14.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,12.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,20.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,22.0,20.0,20.0,20.0,10.0,10.0,20.0,11.0,10.0,20.0,11.0,36.0,36.0,14.0,20.0,20.0,20.0,20.0,10.0,20.0,20.0,11.0,20.0,20.0,20.0,20
.0,20.0,20.0,11.0,20.0,20.0,20.0,23.0,24.0,24.0,23.0,23.0,24.0,38.0,20.0,24.0,18.0,36.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,24.0,11.0,11.0,11.0,11.0,24.0,24.0,24.0,11.0,23.0,23.0,23.0,23.0,24.0,24.0,24.0,24.0,24.0,23.0,24.0,36.0,36.0,36.0,36.0,24.0,24.0,24.0,24.0,24.0,23.0,24.0,23.0,24.0,24.0,24.0,24.0,24.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,21.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,21.0,20.0,20.0,12.0,10.0,10.0,10.0,10.0,10.0,11.0,11.0,10.0,11.0,10.0,11.0,10.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,10.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,12.0,11.0,11.0,11.0,11.0,11.0,10.0,11.0,11.0,18.0,18.0,18.0,20.0,20.0,20.0,20.0,20.0,18.0,20.0,20.0,20.0,11.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,20.0,11.0,11.0,18.0]},"kind":"numeric","n":7124,"n_null":6582,"n_unique":18,"null_rate":0.9239191465468838,"stats":{"iqr":6.0,"kurtosis":1.4744121935907168,"max":39.0,"mean":18.186346863468636,"median":20.0,"min":10.0,"n_outliers":30,"outlier_rate":0.055350553505535055,"q1":14.0,"q3":20.0,"skew":1.05101740129186,"std":6.47248962416443,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.4% null"}],"column":"ReligionSubdivision","extras":{"singletons":2,"top_values":[["Sunni",160],["Judaism",120],["Sikhism",68],["Tibetan",58],["Theravada",49],["Shia",20],["Zoroastrianism",11],["Jainism",11],["Mahayana",9],["Prakriti",9],["Kirati",8],["Mandaeism",6],["Druze",4],["Baha'i",3],["Shia Imami 
Ismaili",2],["Syncretized",2],["Lingayat",1],["Animism",1]]},"kind":"categorical","n":7124,"n_null":6582,"n_unique":18,"null_rate":0.9239191465468838,"stats":{"cardinality":18,"entropy":2.984296845820131,"entropy_ratio":0.7156715875676203,"top_rate":0.2952029520295203,"top_value":"Sunni"}},{"alerts":[],"column":"PCIslam","extras":{"histogram":{"counts":[3635,26,22,13,17,9,9,8,20,1,11,5,21,10,7,7,12,2,4,1,9,3,4,5,11,3,15,14,30,13,25,22,39,20,43,45,103,109,226,2536],"edges":[0.0,2.5,5.0,7.5,10.0,12.5,15.0,17.5,20.0,22.5,25.0,27.5,30.0,32.5,35.0,37.5,40.0,42.5,45.0,47.5,50.0,52.5,55.0,57.5,60.0,62.5,65.0,67.5,70.0,72.5,75.0,77.5,80.0,82.5,85.0,87.5,90.0,92.5,95.0,97.5,100.0]},"sample":[99.9,97.9,94.5,97.0,99.2,100.0,100.0,95.8,97.3,95.4,96.0,97.0,97.0,0.0,99.8499984741211,94.9,100.0,100.0,100.0,99.9100036621094,99.8,100.0,99.99,97.2,99.6,99.9,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,99.98,97.9668674698795,94.6,94.7,93.0,90.0,100.0,100.0,95.0,95.0,100.0,0.0,100.0,15.0,99.9,99.5,100.0,6.0,97.0,0.0,0.0,99.8,99.97,100.0,94.0,94.0,98.0,100.0,0.0,99.409,98.0,97.0,100.0,99.95,100.0,100.0,100.0,100.0,0.0,99.94,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.8491964505792,0.0,25.0,98.0,33.0,98.0,32.8,99.9893834586466,0.0,99.9909090909091,4.0,100.0,95.0,0.0,100.0,99.6,40.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,14.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,96.0,85.0,0.0,5.0,30.0,9.39999961853027,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30.0,3.0,100.0,60.0,12.0,9.0,10.0,99.9899978637695,100.0,100.0,0.0,98.3529411764706,0.0,100.0,0.0,0.0,0.00402000070470132,1.10356536502547,100.0,0.0846540529218739,0.0,100.0,0.0,0.353021045485404,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0514006682086867,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0409465011214792,0.0,0.0,0.0,11.9403823889757,0.0,100.0,0.388828884431415,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.22548931180662,0.0,0.147629316746571,100.0,0.0
,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,98.1727574750831,100.0,0.0,0.0,100.0,100.0,0.0,0.0,100.0,100.0,0.0,0.0,100.0,99.9986429574169,0.0,100.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.9976470588235,100.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.162611240871596,0.0,0.0,0.0,35.0,29.0,40.0,30.0,0.0,0.0,100.0,0.0,0.0,99.9877450980392,0.0,100.0,100.0,0.0,100.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.146818923327896,0.0,0.0,0.0,0.0,0.0,0.0,0.143938495927387,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,1.61851459688398,0.0,0.0,0.261845386533666,0.0,100.0,100.0,0.0,99.9999563228944,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,0.0,100.0,100.0,0.0,100.0,100.0,100.0,0.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,99.9920454545454,100.0,100.0,0.142450142450142,94.0,83.0,73.0,99.0,30.0,100.0,99.9261290322581,99.4693661971831,88.0,75.0,91.0,93.0,92.0,65.0,80.0,19.0,96.0,95.0,100.0,100.0,100.0,98.0,100.0,2.0,86.0,98.0,95.0,99.937,88.3,95.0,69.98,71.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,78.0,76.0,85.0,65.899,99.82373879152,100.0,99.9751550508861,100.0,100.0,79.7,83.0,97.95,0.0,99.9933,98.6,96.8000030517578,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":7124,"n_null":9,"n_unique":902,"null_rate":0.0012633352049410444,"stats":{"iqr":99.99,"kurtosis":-1.9346644616554267,"max":100.0,"mean":45.223052263489045,"median":0.275292498279422,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":99.99,"skew":0.17034253632439114,"std":48.21923220831275,"zero_rate":0.47125790583274774}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+9.11"},{"code":"outliers","level":"warn","message":"12.5% rows beyond 1.5 
IQR"}],"column":"PCNonReligious","extras":{"histogram":{"counts":[6442,159,222,34,73,17,48,18,32,3,9,4,12,5,3,2,2,1,2,2,3,1,2,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,2,1],"edges":[0.0,2.475,4.95,7.425000000000001,9.9,12.375,14.850000000000001,17.325,19.8,22.275000000000002,24.75,27.225,29.700000000000003,32.175000000000004,34.65,37.125,39.6,42.075,44.550000000000004,47.025,49.5,51.975,54.45,56.925000000000004,59.400000000000006,61.875,64.35000000000001,66.825,69.3,71.775,74.25,76.72500000000001,79.2,81.675,84.15,86.625,89.10000000000001,91.575,94.05,96.525,99.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.3,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,14.0,10.0,5.0,0.0,40.0,34.0,0.0,0.0,0.0,50.0,0.0,0.0,0.0,15.0,5.0,5.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,22.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,4.0,15.0,20.0,0.0,10.0,10.0,15.0,14.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,4.2,0.0,0.0,4.0,0.0,7.0,0.0,0.0,3.0,4.8,0.0,5.0,18.8,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.5,2.5,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.36,0.0,0.0,0.0,3.4,1.0,0.0,4.5,3.0,0.0,6.0,6.0,5.0,0.0,4.5,5.0,5.3,5.0,0.0,0.0,0.0,10.0,15.0,0.0,0.0,10.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,2.0,0.0,2.0,54.5,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":7124,"n_null":23,"n_unique":152,"null_rate":0.0032285233015160023,"stats":{"iqr":0.0,"kurtosis":125.34950353242786,"max":99.0,"mean":1.0164019153311528,"median":0.0,"min":0.0,"n_outliers":886,"outlier_rate":0.1247711589916913,"q1":0.0,"q3":0.0,"skew":9.105052230744263,"std":4.548800786327761,"zero_rate":0.8752288410083087}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+6.45"},{"code":"outliers","level":"warn","message":"7.2% rows beyond 1.5 
IQR"}],"column":"PCUnknown","extras":{"histogram":{"counts":[6885,20,9,10,6,2,3,0,0,2,0,2,0,2,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,1,0,0,0,2,152],"edges":[0.0,2.5,5.0,7.5,10.0,12.5,15.0,17.5,20.0,22.5,25.0,27.5,30.0,32.5,35.0,37.5,40.0,42.5,45.0,47.5,50.0,52.5,55.0,57.5,60.0,62.5,65.0,67.5,70.0,72.5,75.0,77.5,80.0,82.5,85.0,87.5,90.0,92.5,95.0,97.5,100.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.254662572091978,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.64816399722868,0.0,0.0,0.0,0.138190954773869,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.157051617631662,0.0,0.0,0.0453926463912846,99.4736842105263,0.0,0.0,0.0,0.0,0.0,0.0712606453542195,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0500062507813477,0.0,0.0,0.0,0.0,0.0430502539964986,0.0,0.0,0.0308706974086075,0.0,0.0,0.0,0.142108782880071,0.0,0.0,0.67933244265302,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.156349182681452,2.51853626718848,0.0,0.0,0.0,0.0,0.0,0.306747659411724,0.0,0.0,0.0,0.0,0.0,0.0,0.0680139914496696,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.183203659493098,0.4624880844077,0.0,0.761296660117878,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.66111226827744,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0
.0,0.0,0.51074081509737,6.92574850299401,5.5032041055858,0.0,0.0,0.0,0.0,0.0935751314730597,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.423536530025715,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.451092117758784,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.03,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.0,100.0,100.0,99.0,99.0,100.0,99.0,100.0,99.0,99.0,99.9861111111111,100.0,99.0,99.0,99.0]},"kind":"numeric","n":7124,"n_null":25,"n_unique":388,"null_rate":0.0035092644581695676,"stats":{"iqr":0.0,"kurtosis":39.85161622984472,"max":100.0,"mean":2.2800663430047483,"median":0.0,"min":0.0,"n_outliers":510,"outlier_rate":0.07184110438089872,"q1":0.0,"q3":0.0,"skew":6.453884067610767,"std":14.590995101482848,"zero_rate":0.9281588956191013}},{"alerts":[{"code":"outliers","level":"warn","message":"24.9% rows beyond 1.5 
IQR"}],"column":"SecurityLevel","extras":{"histogram":{"counts":[1114,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,657,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5353],"edges":[0.0,0.05,0.1,0.15000000000000002,0.2,0.25,0.30000000000000004,0.35000000000000003,0.4,0.45,0.5,0.55,0.6000000000000001,0.65,0.7000000000000001,0.75,0.8,0.8500000000000001,0.9,0.9500000000000001,1.0,1.05,1.1,1.1500000000000001,1.2000000000000002,1.25,1.3,1.35,1.4000000000000001,1.4500000000000002,1.5,1.55,1.6,1.6500000000000001,1.7000000000000002,1.75,1.8,1.85,1.9000000000000001,1.9500000000000002,2.0]},"sample":[2.0,2.0,0.0,2.0,2.0,0.0,1.0,0.0,2.0,0.0,2.0,2.0,0.0,0.0,2.0,0.0,0.0,2.0,2.0,2.0,0.0,2.0,2.0,1.0,2.0,2.0,1.0,0.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,1.0,1.0,0.0,0.0,0.0,2.0,0.0,2.0,0.0,0.0,2.0,1.0,2.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,2.0,1.0,2.0,2.0,2.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,0.0,2.0,2.0,0.0,2.0,2.0,2.0,2.0,0.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,2.0,1.0,0.0,0.0,2.0,2.0,1.0,0.0,2.0,2.0,0.0,0.0,0.0,2.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,0.0,1.0,0.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2
.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,1.0,0.0,2.0,1.0,0.0,0.0,2.0,2.0,1.0,1.0,0.0,2.0,2.0,1.0,2.0,2.0,1.0,2.0,2.0,0.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,0.0,0.0,0.0,1.0,2.0,0.0,1.0,2.0,2.0,0.0,2.0,2.0,0.0,2.0,2.0,0.0,2.0,2.0,2.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,2.0,0.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":3,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":0.4047744497320007,"max":2.0,"mean":1.5950308815272318,"median":2.0,"min":0.0,"n_outliers":1771,"outlier_rate":0.24859629421673218,"q1":2.0,"q3":2.0,"skew":-1.4661032147485806,"std":0.7441723699815839,"zero_rate":0.15637282425603594}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 98.6% of rows"}],"column":"LRTop100","extras":{"singletons":0,"top_values":[["N",7024],["Y",100]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.10650108565610678,"entropy_ratio":0.10650108565610678,"top_rate":0.9859629421673217,"top_value":"N"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"59.6% duplicate 
strings"}],"column":"PhotoAddress","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1970,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5092,0,0,0,0,0,0,0,0,61],"edges":[0.0,0.325,0.65,0.9750000000000001,1.3,1.625,1.9500000000000002,2.275,2.6,2.9250000000000003,3.25,3.575,3.9000000000000004,4.2250000000000005,4.55,4.875,5.2,5.525,5.8500000000000005,6.175,6.5,6.825,7.15,7.4750000000000005,7.800000000000001,8.125,8.450000000000001,8.775,9.1,9.425,9.75,10.075000000000001,10.4,10.725,11.05,11.375,11.700000000000001,12.025,12.35,12.675,13.0]},"near_unique":false,"sample":["p10375.jpg","p21768.jpg","p14099.jpg","p10812.jpg","p16826.jpg","p18274.jpg","p17080.jpg","","p10949.jpg","p13819.jpg","p19198.jpg","p17745.jpg","p18614.jpg","p10376.jpg","p19808.jpg","p21571.jpg","p10161.jpg","p11925.jpg","p19007_kn.jpg","","p11478.jpg","p13922.jpg","p12347.jpg","p11317.jpg","","","p17936.jpg","p10584.jpg","p12054.jpg","p18274.jpg","","p19007.jpg","p20235.jpg","p16500.jpg","","p16944.jpg","","","p17066.jpg","p17721.jpg","","p18628.jpg","p18577.jpg","p18619.jpg","p14039.jpg","p20631.jpg","p15382.jpg","","p10839.jpg","p16100.jpg"],"top_values":[["",1970],["p19007.jpg",90],["p18274.jpg",38],["p14371.jpg",36],["p12322.jpg",34],["p19211.jpg",34],["p12877.jpg",28],["p14983.jpg",27],["p11277.jpg",27],["p13819.jpg",25],["p15727.jpg",24],["p15104.jpg",23],["p13317.jpg",23],["p13437.jpg",22],["p19314.jpg",21],["p10953.jpg",20],["p11982.jpg",20],["p14483.jpg",19],["p10379.jpg",18],["p12247.jpg",18]],"top_words":[["p19007.jpg",90],["p18274.jpg",38],["p14371.jpg",36],["p12322.jpg",34],["p19211.jpg",34],["p12877.jpg",28],["p14983.jpg",27],["p11277.jpg",27],["p13819.jpg",25],["p15727.jpg",24],["p15104.jpg",23],["p13317.jpg",23],["p13437.jpg",22],["p19314.jpg",21],["p10953.jpg",20],["p11982.jpg",20],["p14483.jpg",19],["p10379.jpg",18],["p12247.jpg",18],["p15145.jpg",18],["p10790.jpg",17],["p11029.jpg",17],["p10375.jpg",16],["p15198.jpg",16],["p14256.
jpg",16]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7123,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":1,"n_unique":2880,"null_rate":0.00014037057832678272,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.5956759792222378,"emoji_rate":0.0,"len_max":13,"len_mean":7.2600028078057,"len_median":10.0,"len_min":0,"len_p95":10.0,"n_duplicates":4243,"n_empty":1970,"one_word_rate":1.0,"readability_flesch_mean":84.00800000000002,"url_rate":0.0,"vocab_size":2879,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"long_tail","level":"info","message":"463 singleton categories"}],"column":"PhotoCredits","extras":{"singletons":463,"top_values":[["",1970],["Anonymous",1496],["Operation China, Asia Harvest",263],["Isudas",212],["Kate Nelson/AusAID - Wikimedia",90],["manothegreek",77],["Kerry Olson",76],["Asia Harvest-Operation Myanmar",69],["Steve Evans - Flickr",62],["Final Sudan",43],["Rod Waddington - Flickr",42],["Peoples of Laos, Asia Harvest",41],["COMIBAM / Sepal",37],["Link Up Africa",36],["CharlesFred - Flickr",36],["Asia Harvest",36],["Hamed Saber - Flickr",36],["Peoples of the Buddhist World, Asia Harvest",36],["N-Y-C - Pixabay",34],["pxhere",34]]},"kind":"categorical","n":7124,"n_null":10,"n_unique":851,"null_rate":0.001403705783267827,"stats":{"cardinality":851,"entropy":5.583876588758368,"entropy_ratio":0.5737046952260549,"top_rate":0.2769187517570987,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"465 singleton 
categories"},{"code":"null_rate","level":"warn","message":"36.0% null"}],"column":"PhotoCreditURL","extras":{"singletons":465,"top_values":[["",1970],["https://www.asiaharvest.org",443],["https://tinyurl.com/89ffm33y",90],["https://www.pesquisas.org.br/",37],["https://flickr.com/photos/44124425616@N01/424972149/",36],["https://pixabay.com/photos/fashion-asian-japanese-chinese-4257900/",34],["https://pxhere.com/en/photo/637533",34],["https://www.newcovenantmissions.org",31],["https://www.createinternational.com",30],["https://pixabay.com/photos/person-face-people-portrait-smile-5039573/",27],["https://www.globalROAR.org",26],["https://pixabay.com/photos/bread-marrakesh-food-morocco-1166272/",25],["https://pixabay.com/photos/pakistani-model-boy-model-pakistan-3770152/",24],["https://commons.wikimedia.org/wiki/File:Sudanese_arab_from_manasir_tribe.jpg",23],["https://pixabay.com/photos/refugee-afghan-forest-geocaching-1189087/",21],["https://flickr.com/photos/91418149@N03/14204194758",20],["https://pixabay.com/pl/photos/m%c4%99%c5%bcczy%c5%bani-turban-portret-facet-2146800/",19],["https://commons.wikimedia.org/wiki/File:Algerian_man_with_turban.jpg",18],["https://commons.wikimedia.org/wiki/File:Iraqi_man_on_Baghdad_street.jpg",18],["https://flickr.com/photos/rosluc6460/3260871722",18]]},"kind":"categorical","n":7124,"n_null":2565,"n_unique":774,"null_rate":0.36005053340819765,"stats":{"cardinality":774,"entropy":5.389488265252065,"entropy_ratio":0.5616279379845728,"top_rate":0.43211230533011624,"top_value":""}},{"alerts":[],"column":"PhotoCreativeCommons","extras":{"singletons":0,"top_values":[["N",5682],["Y",1437]]},"kind":"categorical","n":7124,"n_null":5,"n_unique":2,"null_rate":0.0007018528916339135,"stats":{"cardinality":2,"entropy":0.7256210165446637,"entropy_ratio":0.7256210165446637,"top_rate":0.7981458069953645,"top_value":"N"}},{"alerts":[],"column":"PhotoCopyright","extras":{"singletons":0,"top_values":[["N",5735],["Y",1377]]},"kind":"categorical","n":7124,"n
_null":12,"n_unique":2,"null_rate":0.0016844469399213925,"stats":{"cardinality":2,"entropy":0.7089757305249859,"entropy_ratio":0.7089757305249859,"top_rate":0.8063835770528683,"top_value":"N"}},{"alerts":[],"column":"PhotoPermission","extras":{"singletons":0,"top_values":[["N",5715],["Y",1393],["y",2]]},"kind":"categorical","n":7124,"n_null":14,"n_unique":3,"null_rate":0.0019651880965749578,"stats":{"cardinality":3,"entropy":0.7173304783646449,"entropy_ratio":0.45258514194390115,"top_rate":0.8037974683544303,"top_value":"N"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 96.7% of rows"}],"column":"ProfileTextExists","extras":{"singletons":0,"top_values":[["Y",6888],["N",236]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.20984120374636117,"entropy_ratio":0.20984120374636117,"top_rate":0.9668725435148793,"top_value":"Y"}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+5.67"},{"code":"outliers","level":"warn","message":"17.0% rows beyond 1.5 
IQR"}],"column":"CountOfCountries","extras":{"histogram":{"counts":[5710,272,248,163,150,139,123,20,0,109,2,37,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,151],"edges":[1.0,5.075,9.15,13.225000000000001,17.3,21.375,25.450000000000003,29.525000000000002,33.6,37.675000000000004,41.75,45.825,49.900000000000006,53.975,58.050000000000004,62.125,66.2,70.275,74.35000000000001,78.425,82.5,86.575,90.65,94.72500000000001,98.80000000000001,102.875,106.95,111.025,115.10000000000001,119.17500000000001,123.25,127.325,131.4,135.475,139.55,143.625,147.70000000000002,151.775,155.85,159.925,164.0]},"sample":[8.0,18.0,18.0,3.0,1.0,2.0,3.0,21.0,21.0,21.0,9.0,9.0,13.0,6.0,25.0,25.0,2.0,4.0,4.0,3.0,3.0,2.0,1.0,8.0,1.0,1.0,5.0,38.0,38.0,1.0,2.0,1.0,2.0,1.0,1.0,1.0,1.0,10.0,1.0,20.0,20.0,20.0,13.0,7.0,9.0,4.0,4.0,3.0,1.0,4.0,1.0,27.0,27.0,2.0,2.0,1.0,1.0,1.0,1.0,5.0,28.0,28.0,28.0,28.0,28.0,10.0,3.0,39.0,39.0,1.0,15.0,3.0,1.0,4.0,1.0,10.0,2.0,4.0,4.0,4.0,8.0,4.0,3.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,22.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,27.0,27.0,1.0,1.0,2.0,1.0,1.0,2.0,1.0,6.0,6.0,1.0,1.0,3.0,6.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,20.0,20.0,1.0,22.0,22.0,2.0,2.0,1.0,7.0,2.0,2.0,26.0,26.0,26.0,1.0,20.0,1.0,13.0,21.0,21.0,1.0,6.0,2.0,24.0,2.0,2.0,5.0,1.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,2.0,1.0,1.0,2.0,5.0,2.0,3.0,1.0,1.0,1.0,2.0,1.0,3.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,3.0,2.0,1.0,1.0,2.0,2.0,2.0,1.0,3.0,3.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,5.0,1.0,4.0,2.0,3.0,1.0,2.0,2.0,1.0,2.0,3.0,1.0,2.0,2.0,2.0,1.0,5.0,2.0,1.0,2.0,2.0,2.0,3.0,1.0,2.0,1.0,2.0,1.0,1.0,1.0,1.0,3.0,2.0,1.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,4.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,4.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,47.0,47.0,47.0,47.0,1.0,1.0,5.0,2.0,2.0,1.0,1.0,2.0,2.0,2.0,1.0,1.0,1.0,1.0,1.0,3.0,2.0,1.0,3.0,2.0,1.0,1.0,2.0,1.0,2.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,2.0,2.
0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,3.0,1.0,1.0,2.0,1.0,1.0,2.0,1.0,1.0,4.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,2.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,1.0,4.0,1.0,1.0,1.0,9.0,1.0,10.0,2.0,1.0,1.0,1.0,3.0,1.0,1.0,1.0,5.0,1.0,2.0,9.0,2.0,1.0,11.0,11.0,1.0,20.0,20.0,1.0,1.0,4.0,1.0,15.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,10.0,10.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,3.0,1.0,1.0,1.0,2.0,13.0,16.0,16.0,10.0,3.0,3.0,1.0,2.0,3.0,13.0,3.0,10.0,10.0,10.0,38.0,1.0,1.0,1.0,1.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0,164.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":39,"null_rate":0.0,"stats":{"iqr":3.0,"kurtosis":33.16729122666121,"max":164.0,"mean":8.10780460415497,"median":2.0,"min":1.0,"n_outliers":1210,"outlier_rate":0.16984839977540708,"q1":1.0,"q3":4.0,"skew":5.671675430589582,"std":24.27230750677605,"zero_rate":0.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"CountOfProvinces","extras":{},"kind":"unknown","n":7124,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"Longitude","extras":{"histogram":{"counts":[6,2,0,0,0,11,16,2,8,15,48,110,29,24,8,10,0,46,139,229,217,249,173,356,244,243,104,781,1584,970,313,728,135,161,52,36,41,8,3,23],"edges":[-173.08406,-164.2960398,-155.50801959999998,-146.7199994,-137.9319792,-129.143959,-120.35593879999999,-111.56791859999998,-102.7798984,-93.99187819999999,-85.203858,-76.41583779999999,-67.62781759999999,-58.839797399999995,-50.05177719999999,-41.263757,-32.47573679999999,-23.687716599999987,-14.899696399999982,-6.111676200000005,2.6763440000000003,11.464364200000006,20.25238440000001,29.040404600000016,37.82842480000002,46.616445,55.404465200000004,64.19248540000001,72.98050560000001,81.76852580000002,90.556546,99.3445662,108.13258640000001,116.92060660000001,125.70862680000002,134.49664700000002,143.28466720000003,152.07268740000004,160.86070759999998,169.6487278,178.436748]},"sample":[44.22407,13.204459,4.75637000017537,57.11082,23.8228289998584,36.817477,-15.48,4.353942,44.3579454963875,4.881726,58.520528057324,32.73,-0.139529,-0.059751,55.22,-3.61282625412832,5.396386,-12.0447810004428,32.78,-7.3006,2.266761,42.8236170000245,-10.9665290001133,35.937201,-4.568162,41.1,106.923503,-77.0586138483504,100.534287,110.300647000159,117.48659771831,110.097773326678,119.753576941023,124.336234099724,100.689168522409,91.644805,102.016472,36.30381,46.7162,12.5204863523633,19.18231,-90.2762200879866,48.4884032371197,38.18185,59.5756493318511,19.698161,20.608977,73.8,82.473401,72.837668,35.153698443928,-79.5613999997102,28.202922,40.1,38.3514619998714,38.776079,36.693414,36.96,49.6434,46.62289,69.5952071480914,4.47702209609287,16.3428980518036,24.929606,8.547875,-79.359544,68.6194,12.537643,101.701698,70.92815,69.8194799999021,48.75287,70.86259,74.311695,53.3161,40.730514,71.563232,-55.38784,7.433619,6.13151,-73.94161,-74.6011,-46.49623417306
86,-74.1699,34.74222,121.755455850223,16.47117,6.81777,-73.83543,-53.34406,-49.18320556,-50.0027416388888,-62.3588599722222,-63.64796,-78.47,105.26235,119.7989,121.78052,97.34887,102.83383,100.08121,103.277233446167,114.198579,105.165526874665,121.08259,102.96691,122.05304,112.619060922024,114.651815249187,114.55121,123.006219,131.98869,106.60577,105.45147,174.73,8.588308,107.186450072013,107.831132248155,101.1485,106.022676622628,104.97911,104.924415,102.453069035807,-118.18968753725,10.815328,105.75571,105.82539,103.077912988693,101.442001999593,106.37882,107.968159000338,102.4067,98.7269730763464,103.80432,104.36545,105.7313,105.74595,100.766798,96.55,106.749345,105.9151507,107.063317,104.713055555556,103.866851,2.31549996565087,46.7355936533244,83.208854,-9.141152,25.6441,87.5717956467024,73.4714351607671,86.3867838705642,174.742642,75.0264144693544,89.845198,5.1958,-3.95302,-1.4039,70.04196,174.74396,92.41449,69.09,55.401,46.69711,68.5455299996098,51.4698258465855,92.0608123066466,30.70614,82.3108769724513,78.9779850015885,80.7663188126322,75.5220691195217,84.7850943574839,75.9478015041647,78.814123890185,86.900645107557,83.4246222620641,73.8153586015435,85.7627182302543,74.751922537051,83.7309694703453,83.3039223235305,77.7063223535231,69.1119133873487,73.8558672269006,76.767620321331,86.1123255637936,85.0506147326963,75.2983816483942,68.5090413181024,76.8752965828173,84.519891604287,73.7610653199764,85.1300886847166,76.9543455818249,74.380651801771,75.9753148852528,76.8722420508313,77.0741423611576,77.8992871617743,86.8471138184018,88.727211363814,85.2125364624689,75.1491256046594,74.6199841400961,88.532974,74.9029960568785,87.492719878835,75.2213048758092,85.2549134349195,75.4694517121266,74.90458488535,77.6563412540874,87.0840136011006,75.7743932881766,78.7929392502301,78.5576303863458,76.9385191802047,85.3665562768667,82.1330009190645,85.054193,89.4366895435229,88.4192414412866,73.7226103250698,84.6113266855826,74.2567304023307,84.2167407140688,77.87976792
63387,79.7295939818274,83.4402730404831,83.108493693789,77.7902537816703,80.568749,91.5005656753695,83.4033006907495,88.4373249053391,70.4782102259852,82.6817107293464,84.8147457738489,76.6571433654378,90.2773045468516,74.2037551775736,72.6660760242239,88.3373152116027,68.5158572423784,71.4416391496338,74.1305323059,73.3739839653559,70.4294927438062,74.3818091387675,67.0730022864913,77.4176258841282,87.8798349365771,74.7334050000551,74.3755924729531,77.2323335651938,80.7671359963885,84.8096752263879,85.2581996469606,84.8963493627036,75.2802928468983,92.096901315677,80.6783324477098,77.6510440556553,84.8745245126828,69.14856,83.6387642919897,90.5547810114123,83.9835118249687,86.7985464402267,85.0589971103576,71.4579794573767,77.0015896560613,77.4185674613576,71.2558269367288,70.2073008123344,77.5691647669235,76.9578737952867,76.4551635491965,78.4127883410893,68.0358754877,84.925514785117,70.0095780027521,85.1280525394305,76.8831721863116,76.5096122528139,72.6246382399864,71.0187380805677,84.425682,70.8864207887372,89.8968228336191,85.7794460828925,95.2074367136355,75.4597609601617,16.518863,24.947332,113.997702,173.15469,91.21506,78.4101994834501,84.8795415602041,75.8147842223173,88.4774926237139,71.4528021558617,77.7572725897409,77.9363974400517,73.2506797610194,68.50658,77.4419171629863,74.6371570817867,74.2236056886262,91.9662135780592,74.8417226994662,74.5712742434477,85.2348130135405,71.8598747678821,81.4505991494815,87.9672196957107,76.5394710584128,75.2139634933733,77.7237297794237,83.8274776692626,94.302454457839,78.1201108454573,77.1858778660992,76.9347316016324,70.47639,70.4246149300763,73.0805537324138,77.5967472303035,80.1976480054166,78.1436532777866,79.17923613682,78.1621425908289,70.13657,91.8561820239468,73.241,74.43368,81.960243,82.02917,76.5477728653989,78.5811225282082,81.6762019255426,83.6286567098446,82.7723705931273,72.1947172768386,80.5785683512211,69.9297155411401,84.1415756875649,89.4192697859321,76.318816549546,72.8972081032305,78.0104200308
061,74.9617920627326,80.2323192115695,88.18212284,88.8292903,82.78380612,80.64180019,74.34508171,79.131949,69.78928,73.31621257,73.31891299,66.93,83.5760244900262,81.23143,76.9773,76.44194,83.3955,70.42344,73.57485,73.22156,71.0093,81.96173,73.24131,74.37369,80.80792,75.85437,69.05459,88.22917,82.23055,63.10357,71.0093,73.33828,72.04624,88.73683,71.8097,71.56105,71.5,90.46408,74.37369,66.741,71.56105,72.56963,71.0498,72.21621,72.36443,70.64025,78.93507,77.30848,89.74316,81.82573,75.56979,73.09,73.01,90.807,29.3432842524841,-5.09647,-2.7,18.05281,18.76956,-1.90047,3.44433326426872,-4.11507,29.81296,-1.06297,15.26321,9.75923,15.487135,-14.047625,14.51383,39.3853251812875,2.310951,-12.40162,14.17784,29.435,-0.15,33.97785,6.92174,-1.63266,13.06592,15.252,31.12644,29.1192292549262,-7.6104,-15.37384,20.333698,36.09,29.15,76.6785072514293,-78.774901158062,102.22179,100.377094146977,101.55141,101.01648,99.0460799712137,98.90708,105.444469951627,101.379184000341,104.913503891591,99.2209776091293,101.212592794022,104.953184195294,99.2863399514276,100.773903425303,100.488349597619,102.94476,101.678586435316,98.32676,102.791547,93.2389,144.979936139441,30.551501,22.93384,96.2367899998586,74.2922699996607,26.072017,46.54593,51.3654043830059,62.0940299999845,30.458815,74.6046042530838,89.57354,144.8,79.53264,41.57257,144.921009,75.9382875627208,99.29083,123.402621511074,68.75,13.2689673869353,16.22499,27.6493378072939,-61.387168,158.213166,44.8264071840443,7.30478,76.951375383667,17.573,33.755513030402,7.42147,-86.229869,-57.5430988598245,-8.53355,30.0829552816609,-3.84623257927012,68.7872613147578,17.048]},"kind":"numeric","n":7124,"n_null":0,"n_unique":6713,"null_rate":0.0,"stats":{"iqr":47.41191455634363,"kurtosis":2.8589489248209734,"max":178.436748,"mean":62.801128012107284,"median":75.22975927090806,"min":-173.08406,"n_outliers":316,"outlier_rate":0.04435710275126333,"q1":40.81048094365637,"q3":88.2223955,"skew":-1.4023077478833694,"std":44.79069963149318,"zero_rate":0.0}},
{"alerts":[],"column":"Latitude","extras":{"histogram":{"counts":[4,20,18,18,4,11,7,15,14,18,40,45,65,115,74,135,98,158,414,396,299,408,595,961,863,584,560,244,154,257,112,105,131,72,39,52,3,10,3,3],"edges":[-42.60931,-39.7481325,-36.886955,-34.025777500000004,-31.1646,-28.3034225,-25.442245,-22.5810675,-19.71989,-16.8587125,-13.997535,-11.136357499999999,-8.275179999999999,-5.414002500000002,-2.5528249999999986,0.30835250000000514,3.1695300000000017,6.030707499999998,8.891885000000002,11.753062500000006,14.614240000000002,17.4754175,20.336595000000003,23.197772500000006,26.058950000000003,28.9201275,31.781304999999996,34.64248250000001,37.50366,40.3648375,43.22601500000001,46.08719250000001,48.948370000000004,51.8095475,54.670725,57.53190250000001,60.393080000000005,63.2542575,66.11543500000002,68.97661250000002,71.83779]},"sample":[15.325456,32.85696,52.3452829999105,23.29746,14.3181900000685,-1.299822,14.89,50.853378,33.2966339932642,52.359881,23.6293422196677,39.95,51.545268,51.489102,25.1,40.4451667476472,43.300749,27.8764270003058,39.91,29.29423,48.917986,16.997694000078,28.0715390002247,31.958914,34.91654,37.878,47.924249,-11.8618595707626,13.834384,26.3356339999091,24.0819903246937,25.8755337589758,49.6414311289434,47.8789771210973,25.5502206093936,47.998066,35.502744,32.30991,43.272,41.8761475565644,43.21241,38.6102308659617,41.6952991856089,47.426358,42.453990918546,40.660934,41.808167,41.4,65.70591,40.492657,8.06266716076084,43.7354000002098,-25.754106,8.5,3.77198700019989,9.030075,5.609143,5.32,32.31795,35.79053,42.324101435233,51.9291778308922,48.202192384371,60.232544,47.383434,43.739982,38.50093,55.691546,3.15841,35.4495,38.5674900002633,38.09241,36.98774,35.91949,35.71479,37.312238,36.71347,5.62897,43.748566,49.77295,40.65921,45.05512,-23.6162827584425,40.8966,31.95667,14.0619989194383,43.51499,46.19303,10.95076,0.96896,-7.15128889,-15.0861366666666,-13.0060116666666,-4.1223,1.29,-4.59092,-4.758,-7.40148,4.41819,-1.68768,6.64615,-3.62170666273232,22.
343582,-5.22120845760423,-3.15172,3.13217,6.56306,-7.95859597032779,3.96878701447147,3.94871,0.87401,-5.34184,15.55701,18.13807,-36.79,47.358721,26.7566263187496,25.3706406080776,19.19827,17.4054800165895,19.81283,19.229839,20.6311865472214,33.7956895251514,59.924808,23.33917,23.02309,22.7754966798279,21.8499790004305,25.6005,25.8036970003163,20.04497,18.9628452542051,22.29526,18.66322,23.81962,24.29844,22.003533,22.5,14.81146,14.2798,15.868106,18.2333333333333,20.005982,48.8750038873195,24.6325146697162,29.332654,38.743753,-27.51183,22.7405263472688,31.5330675384992,27.6174913214091,-36.754492,34.4672383059352,24.346528,50.70774,38.00406,51.4686,34.96106,-36.8916,22.453974,37.89,25.164,24.636329,28.0997600003237,25.2874113591469,23.2541533897105,-29.93794,17.3588049019042,10.8551010262113,7.01261516223599,12.8852712306571,19.8001025447867,12.5087291316441,34.2144873922675,27.2866128102296,27.9281443878621,21.3450421795165,20.6603665197542,27.4955856914852,21.0448081549979,18.9223070796146,15.1384495162956,27.5569419929166,33.8963314674007,31.8709995829228,26.3525997674092,19.9844767160874,33.9640765403269,25.4934673866915,32.6484318632325,25.3178892055831,22.7142358859654,20.2133358859063,10.367449482,31.3766856030303,31.1423196722175,34.4181614237725,17.117889881169,29.1065229032543,23.293611077175,27.3366984816026,19.8213486547934,25.7924617261605,16.3305373779314,23.729591,32.9542717523598,23.2348456335868,15.3097819093745,20.0846022821806,18.4598815714351,15.1262014951009,32.2984219075399,24.9447597509309,32.5665498284055,24.0378184695282,26.3837920177338,11.072996733517,26.7291191985397,21.7230585840524,19.380912,23.3796951397763,22.8733331448293,22.7980782995423,24.1947829853228,20.4743421003307,21.9985933018562,27.4577596841727,19.0572060641187,21.7921407015783,28.2773265429331,23.513259528931,21.2556115753012,24.9369955762187,26.3743569875058,25.2323907010373,28.4687513420224,22.3984895793198,19.69863882435,34.5020821462011,24.3728195648806,18.8673314354076
,24.1348425894705,24.2197764646213,25.4947247974504,21.7312643892951,31.0124565863,22.6384372066401,30.4805232967313,31.382258081793,24.911427290752,28.345040980719,23.9384916092493,29.8206140415937,31.3778620101126,11.3734421305247,7.0131531199542,19.848311739432,20.0526783456071,20.0062006788874,13.4439206709671,22.638242946612,7.18516362429251,29.0324061298821,19.5742411870631,25.31335,23.5802229335952,24.7393105199291,21.3663035254886,22.1440948240442,19.9264104749748,30.0787131846638,34.1042304288506,28.8363752225835,21.8519681806441,22.5925008170738,11.2946063562399,30.3948136073396,30.8158445525794,23.2280984788687,28.5648695628,19.7722967560016,23.8914022404837,20.9779323794667,10.2078291542732,10.7342514006257,23.3231623729038,22.6572681033085,18.768266,21.5704195710411,22.809865945222,21.1353985927464,27.4018608680525,16.2941438867313,48.263024,60.190815,22.458119,-42.60931,27.47975,10.5474954687349,27.3902893242646,27.5429057599626,23.1002326248716,30.0825644662357,28.1521388989477,29.9404931369518,31.3521069742462,25.49062,28.8884608775018,32.4081096000141,32.1014354058548,23.8881174928165,32.9694596095775,19.0328851941692,27.2127287125889,21.9008972724133,17.0147708513735,22.3997523220159,29.3413896007001,31.7541200065016,30.0146067787175,27.8498578096613,24.5504126170675,25.5639793459062,8.95927166349667,30.5752609509616,28.46237,30.4723071801981,19.2700062410178,31.9285171055509,28.315271286651,24.4142715830119,23.2820664539269,31.4657062204324,24.77378,22.4486130924954,31.35169,23.540091,19.09299,19.088838,15.1213680772961,20.8157524489875,19.4531439710673,26.0521141370615,18.8169616015179,22.7307056066507,25.4587427111742,22.2454424870989,25.9098814435614,24.8326012227519,29.4775729302842,19.1589221072144,9.90669949332113,26.0736683118029,7.66774654752372,25.16802752,22.75085062,17.92154044,26.63243289,33.75650005,21.22778549,25.41303,31.38465505,31.38556234,24.99451,28.1970106025365,26.23141,30.66947,9.44314,27.57517,30.47182,29.40877,33.42657,30.0
7592,25.27631,31.35169,31.37244,25.87518,30.81091,26.86548,24.1716,21.03525,26.01814,30.07592,32.8442,30.48771,22.72786,34.9161,33.97674,34.7,24.10466,31.37244,30.16909,33.97674,35.25229,33.9405,36.17171,33.57134,32.90413,28.09479,30.22377,22.35544,28.09,31.20334,33.57,33.58,24.0112,15.7046659416403,11.58959,8.2426979652389,10.00271,10.25996,9.84855,11.8902242890197,10.24753,11.62269,8.84915,11.24528,10.15143,11.423668,13.390617,12.57452,-6.32807519071389,48.860069,15.16309,10.31267,-3.432,51.43,11.48506,16.7833,10.14498,8.34979,-4.22,11.94442,11.4061320433591,9.72582,16.71271,12.651219,9.06,12.0,32.4599252118963,42.9773834404934,23.46537,26.5063693415718,29.6523,22.04987,25.370726945692,24.70491,26.2414203622599,28.408954000127,27.4710580772684,23.9379097814113,26.3118026051061,26.3047780518656,24.1965705606828,27.4560759466476,34.5232483960148,23.10906,22.2550262980252,14.05959,24.959902,21.3151,43.5518951155671,50.41669,38.4759,52.4455700003552,41.7330799997422,44.450317,43.68536,35.6814805792653,32.3647769999586,50.414373,42.8877942903742,47.16752,-37.8,43.36512,41.01645,-37.680792,39.1533852146559,39.27552,41.8092369441296,38.53,-8.82347161502304,48.11967,53.8840081927239,15.296968,6.961764,41.6960550927683,50.81543,43.2952440539699,29.512,-13.916424353601,43.738215,12.11952,-25.3366360146404,38.54741,-1.97504000319361,40.3289012405997,38.6026810591835,-22.6]},"kind":"numeric","n":7124,"n_null":0,"n_unique":6696,"null_rate":0.0,"stats":{"iqr":16.055427913828673,"kurtosis":2.141333913013126,"max":71.83779,"mean":23.54423988192092,"median":25.021597596171,"min":-42.60931,"n_outliers":292,"outlier_rate":0.04098820887142055,"q1":15.554171055917974,"q3":31.60959896974665,"skew":-0.7020414184166529,"std":14.92328006174876,"zero_rate":0.0}},{"alerts":[],"column":"Ctry","extras":{"singletons":35,"top_values":[["India",2032],["Pakistan",767],["China",442],["Bangladesh",256],["Indonesia",234],["Nepal",184],["Sudan",168],["Laos",142],["Russia",115],["United 
States",90],["Iran",85],["Chad",81],["Malaysia",78],["Thailand",73],["Vietnam",69],["T\u00fcrkiye (Turkey)",61],["Myanmar (Burma)",59],["Afghanistan",58],["Sri Lanka",55],["Canada",52]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":202,"null_rate":0.0,"stats":{"cardinality":202,"entropy":5.058444860597964,"entropy_ratio":0.660525616456381,"top_rate":0.2852330151600225,"top_value":"India"}},{"alerts":[],"column":"IndigenousCode","extras":{"singletons":0,"top_values":[["Y",5657],["N",1467]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.7336183263753842,"entropy_ratio":0.7336183263753842,"top_rate":0.7940763615946098,"top_value":"Y"}},{"alerts":[{"code":"long_tail","level":"info","message":"467 singleton categories"}],"column":"PercentAdherents","extras":{"singletons":467,"top_values":[["0.000",4007],["1.000",285],["2.000",224],["3.000",166],["0.500",159],["5.000",137],["4.000",129],["0.200",96],["0.100",88],["0.300",77],["0.010",59],["1.500",54],["0.050",52],["0.400",47],["0.020",33],["1.200",30],["0.600",29],["0.009",25],["0.800",24],["0.090",22]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":692,"null_rate":0.0,"stats":{"cardinality":692,"entropy":4.045633501855261,"entropy_ratio":0.4288068808058004,"top_rate":0.5624649073554183,"top_value":"0.000"}},{"alerts":[],"column":"PercentChristianPC","extras":{"singletons":11,"top_values":[["0.482",869],["0.111",586],["0.000",374],["0.508",352],["8.571",311],["0.004",293],["5.023",169],["5.345",167],["3.733",151],["1.552",128],["0.008",127],["5.482",114],["27.052",111],["0.005",105],["1.495",90],["6.327",87],["0.731",86],["0.003",81],["0.001",79],["0.030",77]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":184,"null_rate":0.0,"stats":{"cardinality":184,"entropy":5.933585947355625,"entropy_ratio":0.7886671209743489,"top_rate":0.12198203256597417,"top_value":"0.482"}},{"alerts":[{"code":"one_word","level":"warn","message":"48.8% rows are a 
single word"},{"code":"duplicates","level":"warn","message":"34.0% duplicate strings"}],"column":"NaturalName","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1,15,107,590,711,776,702,389,216,278,347,281,431,349,292,219,110,66,47,0,46,35,48,109,174,191,179,103,77,38,35,53,37,36,18,15,0,0,1,2],"edges":[1.0,1.95,2.9,3.8499999999999996,4.8,5.75,6.699999999999999,7.6499999999999995,8.6,9.549999999999999,10.5,11.45,12.399999999999999,13.35,14.299999999999999,15.25,16.2,17.15,18.099999999999998,19.05,20.0,20.95,21.9,22.849999999999998,23.799999999999997,24.75,25.7,26.65,27.599999999999998,28.549999999999997,29.5,30.45,31.4,32.349999999999994,33.3,34.25,35.199999999999996,36.15,37.1,38.05,39.0]},"near_unique":false,"sample":["Arab","Mansoori","Pa'a","Biafada","Ghosi (Hindu traditions)","Turk","Kandu","Tulai","Nigerian Fulani","Moroccan Arab","Walang","Nai (Hindu traditions)","Mulao Jia","Gulf-spoken Arab","Guibian Zhuang","Kulina Pano","Adyghe","Gulud","Deaf","Chunvalia","Dakpa","Nail Bedouin","English-speaking Jewish","Chechen","Darzi Mathuria (Muslim traditions)","Qaisrani Baloch","Ramdasia (Hindu traditions)","Jama Mapun","Hakka Chinese","Turk","Autrah Jat","Rajput Garewal (Muslim traditions)","Rajput Chauhan (Muslim traditions)","Bolodia","Badwa","Ho","Phuma","Khumra (Muslim traditions)","Kamboh (Hindu traditions)","Vaddar (Muslim traditions)","Arabized Temein","Southern Nasu","Baishi Miao","Naheng","Northern Uzbek","Meskhetian Turk","Western Punjabi","Bote-Majhi","Mountain Jewish","Zarma"],"top_values":[["Deaf",151],["Turk",38],["Persian",36],["Japanese",34],["South Asian",34],["Somali",27],["Northern Kurd",27],["Thai",27],["Moroccan Arab",25],["Sudanese Arab",23],["Nepali",23],["Urdu",23],["Malay",21],["Afghan",21],["Bosniak",20],["Punjabi",19],["Arabic-speaking Algerian",18],["Iraqi Arab",18],["Bengali-speaking South 
Asian",17],["Gujarati",17]],"top_words":[["traditions)",952],["(hindu",477],["(muslim",411],["pashtun",271],["arab",241],["jat",232],["rajput",207],["deaf",151],["brahmin",126],["jewish",121],["northern",77],["bania",74],["baloch",64],["berber",61],["south",61],["(sikh",61],["asian",58],["turk",58],["khel",52],["western",48],["tai",48],["southern",47],["thai",43],["malay",41],["persian",38]],"vocab_skipped":null,"word_histogram":{"counts":[3480,0,0,0,0,0,0,2403,0,0,0,0,0,0,0,980,0,0,0,0,0,0,253,0,0,0,0,0,0,8],"edges":[1.0,1.1333333333333333,1.2666666666666666,1.4,1.5333333333333332,1.6666666666666665,1.8,1.9333333333333333,2.0666666666666664,2.2,2.333333333333333,2.466666666666667,2.6,2.7333333333333334,2.8666666666666667,3.0,3.1333333333333333,3.2666666666666666,3.4,3.533333333333333,3.6666666666666665,3.8,3.933333333333333,4.066666666666666,4.2,4.333333333333334,4.466666666666667,4.6,4.733333333333333,4.866666666666667,5.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":4705,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.3395564289724874,"emoji_rate":0.0,"len_max":39,"len_mean":11.84250421111735,"len_median":10.0,"len_min":1,"len_p95":27.0,"n_duplicates":2419,"n_empty":0,"one_word_rate":0.4884896125772038,"readability_flesch_mean":56.41992500000002,"url_rate":0.0,"vocab_size":4343,"word_mean":1.723469960696238,"word_median":2.0}},{"alerts":[{"code":"one_word","level":"warn","message":"72.7% rows are a single word"},{"code":"null_rate","level":"warn","message":"48.5% null"},{"code":"duplicates","level":"warn","message":"59.4% duplicate 
strings"}],"column":"NaturalPronunciation","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1,251,136,47,112,595,517,143,181,392,243,123,83,121,114,104,137,112,59,48,46,29,17,20,15,7,4,2,1,6,1,1,0,0,0,1,1,0,0,2],"edges":[2.0,3.0,4.0,5.0,6.0,7.0,8.0,9.0,10.0,11.0,12.0,13.0,14.0,15.0,16.0,17.0,18.0,19.0,20.0,21.0,22.0,23.0,24.0,25.0,26.0,27.0,28.0,29.0,30.0,31.0,32.0,33.0,34.0,35.0,36.0,37.0,38.0,39.0,40.0,41.0,42.0]},"near_unique":false,"sample":["gulf AE-rub","pahsh-TOON yooz-ahf-SYE","KOO-kong","zah-RAH-moh","nay-PAH-lee","def","pahsh-TOON","uh-ZARE-ee","woh-row-doo-GOO","ee-ZAR-ghee-en BUR-bur","moo-sah-LEE","kan-DOO","BAHNG-kah","gulf AE-rub","muh-LAY","soh-MAH-lee","tee-HAH-mee AE-rub","bur-MEEZE","def","goo-jah-RAH-tee","BAHN-ten","leh-buh-NEEZ AE-rub","kare-uh-CHYE","ooz-BEH-kee AE-rub","jot DIH-lun","BOH-boh MAH-dah-ray","rain","too-NEE","soo-dun-EEZ AE-rub","def","TUH-kur","kuh-MAHN dung","oh-MAH-nee AE-rub","ben-GAH-lee","tie LOO","pahsh-TOON","terk","DAH-gee","Sher-pah","jahd","WOE-loff","tah-TAR","BAHNG-koo-loo","tah-TAR","mes-KEH-tee-un turk","def","yoy","CHAHK","lok","Jeeow-chung Chee-ung"],"top_values":[["def",151],["terk",38],["PUR-zhun",36],["kerd",35],["jae-puh-NEEZ",34],["pahsh-TOON",34],["AY-zhun",34],["tye",30],["soh-MAH-lee",27],["muh-LAY",27],["ee-RAH-kee AE-rub",26],["moh-RAH-kuhn AE-rub",25],["OOR-doo",24],["soo-dun-EEZ AE-rub",23],["nay-PAH-lee",23],["AHF-gahn",21],["YEH-meh-nee 
AE-rub",20],["BOZZ-nee-ak",20],["goo-jah-RAH-tee",19],["puhn-JAH-bee",19]],"top_words":[["ae-rub",239],["def",151],["joo",103],["rahj-put",50],["brah-min",49],["terk",45],["tye",41],["bur-bur",40],["pur-zhun",39],["pahsh-toon",37],["kerd",35],["ay-zhun",35],["jae-puh-neez",34],["muh-lay",33],["jot",30],["soh-mah-lee",28],["ee-rah-kee",26],["moh-rah-kuhn",25],["foo-lah-nee",25],["tah-tar",25],["tie",24],["oor-doo",24],["bahn-yah",24],["soo-dun-eez",23],["ahf-gahn",23]],"vocab_skipped":null,"word_histogram":{"counts":[2670,0,0,0,0,0,0,0,0,0,0,0,0,0,0,974,0,0,0,0,0,0,0,0,0,0,0,0,0,28],"edges":[1.0,1.0666666666666667,1.1333333333333333,1.2,1.2666666666666666,1.3333333333333333,1.4,1.4666666666666668,1.5333333333333332,1.6,1.6666666666666665,1.7333333333333334,1.8,1.8666666666666667,1.9333333333333333,2.0,2.0666666666666664,2.1333333333333333,2.2,2.2666666666666666,2.333333333333333,2.4,2.466666666666667,2.533333333333333,2.6,2.666666666666667,2.7333333333333334,2.8,2.8666666666666667,2.9333333333333336,3.0]}},"kind":"text","n":7124,"n_null":3452,"n_unique":1489,"null_rate":0.4845592363840539,"stats":{"allcaps_rate":0.0005446623093681918,"boilerplate_rate":0.0,"duplicate_rate":0.5944989106753813,"emoji_rate":0.0,"len_max":42,"len_mean":10.772875816993464,"len_median":10.0,"len_min":2,"len_p95":21.0,"n_duplicates":2183,"n_empty":0,"one_word_rate":0.7271241830065359,"readability_flesch_mean":69.92877500000003,"url_rate":0.0,"vocab_size":1537,"word_mean":1.2805010893246187,"word_median":1.0}},{"alerts":[],"column":"PercentChristianPGAC","extras":{"singletons":381,"top_values":[["0.000",3121],["3.733",151],["1.000",87],["2.000",79],["0.001",75],["0.006",69],["5.000",65],["3.000",59],["0.010",55],["4.000",55],["0.500",50],["0.002",46],["0.005",45],["0.030",45],["0.049",44],["0.100",39],["0.200",37],["1.592",37],["0.009",36],["1.771",36]]},"kind":"categorical","n":7124,"n_null":5,"n_unique":842,"null_rate":0.0007018528916339135,"stats":{"cardinality":842,"entropy":5.6809443300
58826,"entropy_ratio":0.5845990422745744,"top_rate":0.43840427026267736,"top_value":"0.000"}},{"alerts":[{"code":"long_tail","level":"info","message":"256 singleton categories"}],"column":"PercentEvangelical","extras":{"singletons":256,"top_values":[["0.000",4195],["0.100",171],["0.200",154],["0.500",135],["1.000",133],["0.300",108],["2.000",92],["0.400",71],["0.050",60],["0.010",60],["0.800",46],["1.500",40],["0.900",38],["0.600",35],["0.030",32],["0.700",29],["0.020",27],["0.080",25],["0.001",25],["0.006",24]]},"kind":"categorical","n":7124,"n_null":741,"n_unique":401,"null_rate":0.10401459854014598,"stats":{"cardinality":401,"entropy":3.1457049012367606,"entropy_ratio":0.36377219133117733,"top_rate":0.6572144759517469,"top_value":"0.000"}},{"alerts":[],"column":"PercentEvangelicalPC","extras":{"singletons":11,"top_values":[["0.199",869],["0.095",586],["0.000",441],["0.247",352],["0.004",315],["3.409",311],["3.339",169],["2.656",167],["0.003",151],["0.001",131],["0.866",128],["1.699",114],["0.472",111],["0.028",96],["1.315",90],["1.509",87],["0.439",86],["0.036",78],["0.012",77],["0.197",76]]},"kind":"categorical","n":7124,"n_null":153,"n_unique":166,"null_rate":0.021476698483997754,"stats":{"cardinality":166,"entropy":5.777065807145899,"entropy_ratio":0.7833267687479762,"top_rate":0.1246593028259934,"top_value":"0.199"}},{"alerts":[],"column":"PercentEvangelicalPGAC","extras":{"singletons":215,"top_values":[["0.000",3264],["1.801",151],["0.002",98],["0.001",93],["0.006",68],["0.004",66],["1.000",59],["0.016",58],["0.200",42],["0.010",42],["0.100",41],["0.005",41],["0.049",40],["0.500",37],["0.104",37],["0.074",36],["2.000",36],["1.543",36],["0.007",35],["0.003",34]]},"kind":"categorical","n":7124,"n_null":450,"n_unique":548,"null_rate":0.06316676024705221,"stats":{"cardinality":548,"entropy":4.971917523537102,"entropy_ratio":0.5464827424437071,"top_rate":0.4890620317650584,"top_value":"0.000"}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+3.48"}
,{"code":"outliers","level":"warn","message":"17.0% rows beyond 1.5 IQR"}],"column":"PCBuddhism","extras":{"histogram":{"counts":[6435,27,19,7,25,3,13,3,14,4,6,3,21,5,9,3,22,4,2,5,4,3,10,10,16,3,9,24,18,7,6,12,14,8,13,20,29,9,76,179],"edges":[0.0,2.5,5.0,7.5,10.0,12.5,15.0,17.5,20.0,22.5,25.0,27.5,30.0,32.5,35.0,37.5,40.0,42.5,45.0,47.5,50.0,52.5,55.0,57.5,60.0,62.5,65.0,67.5,70.0,72.5,75.0,77.5,80.0,82.5,85.0,87.5,90.0,92.5,95.0,97.5,100.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40.0,70.0,70.5,97.0,1.0,0.0,92.7,0.0,8.0,40.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40.0,30.0,96.5,95.0,20.0,98.7999999970198,99.0,0.0,0.0,0.0,0.0,0.0,98.0,10.0,75.0,0.0,0.0,0.0,0.0,0.0,0.0,75.0,0.0,0.0,0.0,100.0,10.0,40.0,0.0,0.0,0.0,0.0,42.072556264696,0.0,0.0,100.0,0.0,0.217206185439781,0.0,0.0,0.0,0.0,0.0,0.0141040408076914,4.05497198969985,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0534850506344738,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.042713567839196,0.23826332509707,100.0,0.0,0.045004500450045,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.286615075952995,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00241542476452197,74.3077621425329,0.0,0.0,0.0,0.0,0.0,0.0,1.40700008589453,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0463311519082643,0.00759013282732448,0.0,0.0,0.434380490136727,0.0,0.0,0.0574003386619981,0.141634493241774,63.5724512082163,0.0,0.00564354937001107,0.0,0.0015364575775527,0.193704996281191,0.0,0.0,0.0,0.00905776590204026,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.579386617021186,0.0326131810497451,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.187989584881564,0.00573341389514909,0.0324191143097971,0.0,0.
0,0.0,0.347721266632667,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00186066216672678,0.00320738982615947,100.0,0.0,0.0,0.0,100.0,0.0,0.0,20.0,3.0,0.0,0.0,0.0,99.9,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00937717414319852,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.53301747112822,0.0,0.0,0.0,0.0,1.37741046831956,0.0,0.0,96.1154572430537,0.0,0.0,0.0,0.00921680223046614,0.0,0.124006398730174,0.0,0.0,0.0,0.0,0.0,0.0414340544312631,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0606838497376282,0.072805091118602,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,98.0,100.0,98.3532934131736,54.99,0.0,60.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,70.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,85.0,0.0,0.0,0.0,0.0,65.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":7124,"n_null":24,"n_unique":809,"null_rate":0.003368893879842785,"stats":{"iqr":0.0,"kurtosis":10.558689432677838,"max":100.0,"mean":6.41072627084623,"median":0.0,"min":0.0,"n_outliers":1208,"outlier_rate":0.17014084507042254,"q1":0.0,"q3":0.0,"skew":3.475117961353116,"std":22.390570471082555,"zero_rate":0.8298591549295775}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+2.16"},{"code":"outliers","level":"warn","message":"22.0% rows beyond 1.5 
IQR"}],"column":"PCEthnicReligions","extras":{"histogram":{"counts":[5603,76,108,48,71,15,30,20,45,11,27,14,42,4,15,9,23,1,13,5,7,5,6,10,21,3,26,12,30,3,8,16,40,18,44,18,56,57,223,323],"edges":[0.0,2.5,5.0,7.5,10.0,12.5,15.0,17.5,20.0,22.5,25.0,27.5,30.0,32.5,35.0,37.5,40.0,42.5,45.0,47.5,50.0,52.5,55.0,57.5,60.0,62.5,65.0,67.5,70.0,72.5,75.0,77.5,80.0,82.5,85.0,87.5,90.0,92.5,95.0,97.5,100.0]},"sample":[0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,62.0,0.0,0.0,0.0,43.0,0.0,2.0,95.0,48.0,29.9,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,98.3846153846154,0.0,0.0,0.0,15.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,65.0,69.5,79.958,80.0,100.0,90.0,85.0,85.0,100.0,100.0,97.0,98.1,99.0,100.0,100.0,96.0,100.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,66.0,14.0,0.0,0.0,0.0,96.6538461538462,0.0,0.0,0.0,0.0,0.0,95.0,60.0,0.0,0.0,20.0,0.9,0.0,100.0,70.0,100.0,97.9981983785407,98.75,0.0,89.8148927219184,25.0,96.0,94.8,95.0,98.0,96.3000030517578,95.0,21.5,99.0,94.8,80.0,100.0,59.9,59.7,100.0,70.0,100.0,30.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,13.9998392670578,23.0,1.0,30.0,0.0,0.0,0.0,4.8,23.0,0.0,7.0,7.0,30.0,20.0,76.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,95.0,10.0,0.0,33.0,0.0,10.0,4.0,30.0,0.0,25.0,0.0,0.0,1.6,10.0,96.0,97.9,95.0,95.0,97.0,96.9,95.0,95.5,0.0,93.9,30.0,98.0,94.0,94.0,95.0,0.0,95.0,100.0,0.0,3.0,0.0,0.0,86.0,0.0,97.0,0.0,95.0,0.0,0.0,5.0,96.0,0.0,0.0,0.0,10.0,50.0,31.8,45.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":7124,"n_null":18,"n_unique":351,"null_rate":0.0025266704098820887,"stats":{"iqr":0.0,"kurtosis":2.8849826867427923,"max":100.0,"mean":13.109499979504518,"median":0.0,"min":0.0,"n_outliers":1560,"outlier_rate":0.2195327891922319,"q1":0.0,"q3":0.0,"skew":2.1552873886971153,"std":30.744009593510953,"zero_rate":0.780467210807768}},{"alerts":[],"column":"PCHinduism","extras":{"histogram":{"counts":[4856,10,14,2,9,6,7,3,10,8,4,4,5,6,2,2,4,5,0,3,6,1,8,4,7,1,8,7,12,5,5,9,9,12,11,20,23,31,117,1844],"edges":[0.0,2.5,5.0,7.5,10.0,12.5,15.0,17.5,20.0,22.5,25.0,27.5,30.0,32.5,35.0,37.5,40.0,42.5,45.0,47.5,50.0,52.5,55.0,57.5,60.0,62.5,65.0,67.5,70.0,72.5,75.0,77.5,80.0,82.5,85.0,87.5,90.0,92.5,95.0,97.5,100.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,57.927443735304,23.0,0.0,0.0,99.431873846807,100.0,98.579520912266,91.0,99.9317
126468178,0.0,0.0,100.0,15.0,98.0,95.5990952032466,83.2748455290979,93.0,0.0,0.0,27.0,34.0,95.046768707483,0.0,97.0,0.0,0.0,100.0,100.0,100.0,99.9733391098595,0.0,100.0,99.8766666666667,99.9357142857143,98.9992301770593,100.0,100.0,23.1018518518519,99.5815730835543,100.0,100.0,100.0,100.0,100.0,99.9414551067114,100.0,99.9972032274755,99.7879574082814,100.0,0.0,100.0,99.9833387903754,98.0188600430109,100.0,100.0,99.6954865041532,99.2661489888216,100.0,99.5065974836246,99.6583241961974,100.0,100.0,0.0,78.4784784784785,98.8746681459761,100.0,98.5526615630023,100.0,99.9098720182659,99.2107662584207,100.0,100.0,99.8876709123964,100.0,99.9855397383054,99.957599640844,95.535077663901,100.0,100.0,99.9034282955094,99.3253981351184,100.0,100.0,100.0,96.0691642651297,99.9948333763885,99.2161182816551,99.6249531191399,0.0,0.0,88.195991091314,62.1945803566643,99.9995028590267,99.8708492380105,96.6,100.0,99.0465075990658,100.0,100.0,99.9891878911209,95.940147124387,0.0,0.0,0.0,99.6119402985075,0.0,0.0,97.2222222222222,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.631424,100.0,100.0,100.0,99.8137601935824,0.0,0.0,0.0,99.3527050977137,100.0,100.0,100.0,98.8279841327083,99.6837509882782,100.0,99.4947532063739,100.0,100.0,99.8964113947466,100.0,97.2884386174017,0.0,0.0,0.0,100.0,0.0,100.0,0.0,98.9719181342218,100.0,99.8566820135396,0.0,100.0,97.4907484260545,97.1999486817628,96.1689587426326,99.6923076923077,0.0,14.6341463414634,55.0,29.0,96.0,66.0,73.0,100.0,0.0,0.0,100.0,72.1983725680608,100.0,0.0,0.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,99.9962552591581,0.0,0.0,0.0,100.0,94.542803582587,100.0,100.0,100.0,0.0,0.0,0.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,0.0,97.6115237904035,92.4652694610779,93.823248855618,100.0,100.0,100.0,0.0,99.4385492111616,100.0,100.0,99.4669825288718,100.0,100.0,100.0,99.9873856164492,100.0,100.0,0.0,99.9398145999629,0.0,97.0503705944638,100.0,0.0,99.7381546134663,98.3425414364641,0.0,0.0,0.0,0.0,99.835092348285,99.1517128874388,100.0,100.0,0.0,0.0,0
.0,0.0,99.9383976207446,99.8992419098696,0.0,0.0,100.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,99.2996201329535,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":7124,"n_null":24,"n_unique":1131,"null_rate":0.003368893879842785,"stats":{"iqr":98.41721788343582,"kurtosis":-1.2156844350319316,"max":100.0,"mean":29.820105515783194,"median":0.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":98.41721788343582,"skew":0.872070203375224,"std":44.98014167522683,"zero_rate":0.6767605633802817}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+7.39"},{"code":"outliers","level":"warn","message":"12.0% rows beyond 1.5 
IQR"}],"column":"PCOtherSmall","extras":{"histogram":{"counts":[6854,30,24,11,12,5,4,4,1,21,2,3,4,0,1,3,3,0,0,0,0,0,3,2,3,0,0,3,3,0,1,0,2,2,2,0,2,0,2,93],"edges":[0.0,2.5,5.0,7.5,10.0,12.5,15.0,17.5,20.0,22.5,25.0,27.5,30.0,32.5,35.0,37.5,40.0,42.5,45.0,47.5,50.0,52.5,55.0,57.5,60.0,62.5,65.0,67.5,70.0,72.5,75.0,77.5,80.0,82.5,85.0,87.5,90.0,92.5,95.0,97.5,100.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.1,2.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,25.0,24.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.9,0.0,0.0,0.0,0.0,0.0,0.9,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.321366653981141,0.01724686902993,0.0,0.0123412605363512,0.0,0.0682873531821907,0.0,0.0,0.0,71.25,0.0,0.0,0.0492309911169264,2.0,0.0,0.0,70.8,41.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0769822940723634,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0195149644295421,0.0,0.00279677252450672,0.0209694084829908,0.0,0.0,0.0,0.0,0.0234186895779513,0.0,0.0,0.0167402707140921,0.0,0.0,0.0432769680877441,0.000454961123571991,0.0,0.0,0.0,1.73506840173507,0.0118873083171534,0.0,0.0215561043808163,0.0,0.0,0.0120698441649009,0.0,0.0,0.00814454211821502,0.0,0.0,0.0174589714171697,0.00875946508866525,0.0,0.0,0.0,0.0439066299011151,0.0,0.0,0.0,0.0,0.0,0.466504341830248,0.0,0.0,0.0,0.0,0.0103369857349597,0.000124285243333417,0.0,0.16,0.0,0.0,0.0,0.0,0.00216242177581491,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0131959716820199,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.028723070148997,0.0,0.0,0.0,0.0,0.0,0.0,0.0291488534784299,0.0,0.0,0.103588605253422,0.0,2.26460071513707,100.0,99.4684172818978,100.0,0.0,0.0
,0.0,100.0,0.0,0.0,0.00682105699705543,0.0,0.0,0.0166727679331929,0.0256591186092758,0.0,0.0,0.0,0.0,2.5,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,27.8016274319392,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00374474084190585,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00301144348524393,0.0,0.000410099268628964,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000725125301652125,0.0,0.0453789139313266,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.848287112561175,0.0,0.0,0.0,100.0,0.0,0.0,0.0350899628670215,0.0297694357203459,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.106837606837607,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":7124,"n_null":24,"n_unique":670,"null_rate":0.003368893879842785,"stats":{"iqr":0.0,"kurtosis":54.18248726406884,"max":100.0,"mean":1.8357846756141856,"median":0.0,"min":0.0,"n_outliers":851,"outlier_rate":0.11985915492957747,"q1":0.0,"q3":0.0,"skew":7.389811652192254,"std":12.333801116249889,"zero_rate":0.8801408450704226}},{"alerts":[{"code":"outliers","level":"warn","message":"8.4% rows beyond 1.5 
IQR"}],"column":"RegionCode","extras":{"histogram":{"counts":[75,0,0,726,0,0,0,521,0,0,3349,0,0,0,352,0,0,0,444,0,0,373,0,0,0,460,0,0,0,223,0,0,320,0,0,0,121,0,0,160],"edges":[1.0,1.275,1.55,1.8250000000000002,2.1,2.375,2.6500000000000004,2.9250000000000003,3.2,3.475,3.75,4.025,4.300000000000001,4.575,4.8500000000000005,5.125,5.4,5.675000000000001,5.95,6.2250000000000005,6.5,6.775,7.050000000000001,7.325,7.6000000000000005,7.875000000000001,8.15,8.425,8.700000000000001,8.975000000000001,9.25,9.525,9.8,10.075000000000001,10.350000000000001,10.625,10.9,11.175,11.450000000000001,11.725000000000001,12.0]},"sample":[6.0,6.0,10.0,6.0,7.0,7.0,8.0,10.0,6.0,10.0,6.0,5.0,10.0,10.0,6.0,10.0,10.0,6.0,5.0,6.0,10.0,6.0,6.0,6.0,6.0,5.0,3.0,11.0,2.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,6.0,9.0,10.0,9.0,12.0,5.0,9.0,5.0,9.0,9.0,5.0,9.0,5.0,7.0,12.0,7.0,7.0,7.0,7.0,7.0,7.0,5.0,5.0,5.0,10.0,10.0,10.0,10.0,12.0,5.0,10.0,2.0,5.0,5.0,5.0,5.0,4.0,5.0,5.0,5.0,11.0,10.0,10.0,12.0,12.0,11.0,12.0,6.0,2.0,9.0,10.0,11.0,11.0,11.0,11.0,11.0,11.0,11.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,10.0,3.0,3.0,2.0,2.0,2.0,2.0,2.0,12.0,10.0,3.0,3.0,3.0,3.0,3.0,3.0,2.0,2.0,2.0,2.0,3.0,3.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,10.0,6.0,4.0,10.0,7.0,4.0,4.0,4.0,1.0,4.0,4.0,10.0,10.0,10.0,5.0,1.0,4.0,5.0,6.0,6.0,4.0,6.0,4.0,7.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,10.0,10.0,3.0,1.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.
0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,7.0,8.0,8.0,8.0,8.0,8.0,8.0,8.0,7.0,8.0,8.0,8.0,8.0,8.0,8.0,7.0,10.0,8.0,8.0,7.0,10.0,7.0,8.0,8.0,8.0,8.0,7.0,7.0,8.0,8.0,8.0,7.0,7.0,4.0,12.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,2.0,2.0,3.0,2.0,3.0,9.0,9.0,9.0,5.0,9.0,9.0,5.0,5.0,9.0,5.0,3.0,1.0,5.0,5.0,1.0,3.0,3.0,3.0,5.0,7.0,10.0,9.0,12.0,1.0,9.0,10.0,5.0,6.0,7.0,10.0,11.0,11.0,10.0,7.0,10.0,5.0,7.0]},"kind":"numeric","n":7124,"n_null":0,"n_unique":12,"null_rate":0.0,"stats":{"iqr":2.0,"kurtosis":0.577531118681248,"max":12.0,"mean":5.005474452554744,"median":4.0,"min":1.0,"n_outliers":601,"outlier_rate":0.08436271757439641,"q1":4.0,"q3":6.0,"skew":1.121537933130152,"std":2.4571802971749355,"zero_rate":0.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+25.48"},{"code":"outliers","level":"warn","message":"17.8% rows beyond 1.5 
IQR"}],"column":"PopulationPGAC","extras":{"histogram":{"counts":[6626,327,104,9,0,51,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2],"edges":[10.0,23128254.75,46256499.5,69384744.25,92512989.0,115641233.75,138769478.5,161897723.25,185025968.0,208154212.75,231282457.5,254410702.25,277538947.0,300667191.75,323795436.5,346923681.25,370051926.0,393180170.75,416308415.5,439436660.25,462564905.0,485693149.75,508821394.5,531949639.25,555077884.0,578206128.75,601334373.5,624462618.25,647590863.0,670719107.75,693847352.5,716975597.25,740103842.0,763232086.75,786360331.5,809488576.25,832616821.0,855745065.75,878873310.5,902001555.25,925129800.0]},"sample":[3096000.0,38179700.0,38179700.0,706000.0,43000.0,6063000.0,2734000.0,22449700.0,22449700.0,22449700.0,4909100.0,4909100.0,2816900.0,81200.0,31513800.0,31513800.0,208200.0,533000.0,19960100.0,3682000.0,3682000.0,3296000.0,34400.0,12119600.0,97000.0,670000.0,182500.0,119686000.0,119686000.0,297000.0,17000.0,2500.0,2656900.0,51000.0,42000.0,13000.0,2500.0,458000.0,1009000.0,3139000.0,3139000.0,3139000.0,13000.0,188700.0,896600.0,2800.0,53000.0,155400.0,1900.0,10700.0,117100.0,28900200.0,28900200.0,214000.0,1944000.0,2900.0,52000.0,2459000.0,80000.0,209000.0,3785400.0,16544400.0,16544400.0,16544400.0,16544400.0,16544400.0,160700.0,6800.0,48380900.0,48380900.0,11000.0,12386800.0,759600.0,9100.0,139000.0,26000.0,811900.0,811900.0,34200.0,525700.0,145700.0,808900.0,3200.0,96600.0,43600.0,43000.0,100.0,1600.0,19000.0,21000.0,200.0,300.0,200.0,100.0,16000.0,9000.0,95000.0,78000.0,607300.0,29000.0,9548000.0,96000.0,172000.0,18869300.0,700.0,240000.0,258100.0,700.0,500.0,65000.0,597000.0,35000.0,600.0,900.0,33000.0,24364900.0,24364900.0,9600.0,63000.0,1600.0,1064000.0,27800.0,719000.0,700.0,40000.0,19067500.0,14000.0,23800.0,1400.0,324000.0,1105800.0,24000.0,490000.0,1178000.0,200.0,1400.0,200.0,400.0,1309000.0,66000.0,115000.0,80000.0,900.0,13000.0,5500.0,1100.0,3800.0,900.0,5091400.0,5091400.0,68000.0,2917000.0
,2917000.0,2795500.0,216200.0,216200.0,216200.0,23000.0,130300.0,1700100.0,1550700.0,501900.0,528700.0,714500.0,9558900.0,2064400.0,2064400.0,2064400.0,5400.0,99000.0,2927200.0,2927200.0,211000.0,1700.0,59282900.0,15900000.0,6700.0,2521000.0,6318000.0,3500.0,695900.0,231000.0,1433000.0,9400.0,47300.0,2000.0,49030100.0,60800.0,13000.0,6100.0,2300.0,4300.0,154000.0,421800.0,58000.0,236700.0,8700.0,1900.0,117600.0,138000.0,1300.0,1567000.0,2100.0,15000.0,1400.0,1200.0,139000.0,11000.0,1620000.0,77000.0,1500.0,179000.0,29000.0,9000.0,1185000.0,20000.0,5930000.0,20000.0,217500.0,174000.0,4200.0,122000.0,8522000.0,30700.0,592000.0,10000.0,78000.0,773000.0,6100.0,2389000.0,717000.0,9000.0,195000.0,1900.0,16585800.0,2100.0,62000.0,677000.0,1400.0,7973000.0,9628000.0,319000.0,140000.0,140000.0,117000.0,4560000.0,241000.0,1527000.0,197600.0,788200.0,211000.0,881100.0,1276000.0,15000.0,7826000.0,2186000.0,560000.0,183000.0,23600.0,50000.0,16300.0,154000.0,170000.0,12388000.0,6132000.0,842000.0,2900.0,148000.0,148000.0,68000.0,3100.0,38000.0,2326000.0,124600.0,262000.0,81000.0,63000.0,8900.0,881500.0,37000.0,106000.0,93000.0,40000.0,6700.0,1300.0,1300.0,71000.0,5268000.0,61000.0,10723800.0,5800.0,1400.0,1100.0,558000.0,1800.0,16300.0,16300.0,51200.0,10781900.0,10781900.0,10781900.0,10781900.0,10781900.0,13000.0,1273200.0,20800.0,327300.0,82000.0,122000.0,279500.0,110000.0,492000.0,61000.0,330000.0,241900.0,406400.0,54000.0,568000.0,129000.0,198000.0,54000.0,2751000.0,351000.0,256300.0,46000.0,78000.0,107000.0,43000.0,48000.0,76000.0,237500.0,216000.0,57400.0,39000.0,1353700.0,50000.0,600000.0,70000.0,13000.0,2000.0,900.0,504000.0,163000.0,1232000.0,110000.0,1700.0,141700.0,49000.0,1100.0,3400.0,6100.0,68000.0,35000.0,534000.0,594000.0,299000.0,8500.0,243000.0,10000.0,1900.0,57200.0,57200.0,24000.0,88000.0,153100.0,1900.0,196000.0,460000.0,67000.0,45200.0,8312000.0,3900.0,54000.0,30000.0,174000.0,153000.0,126000.0,103000.0,150000.0,1350000.0,34000.0,38000.0,26800.0,907000.0,8230
00.0,541000.0,682100.0,18000.0,95000.0,31000.0,57000.0,182000.0,673000.0,7800.0,195000.0,132000.0,23000.0,10000.0,49000.0,38000.0,212000.0,494000.0,129000.0,927000.0,71900.0,27700.0,31000.0,5078900.0,1800.0,13000.0,27000.0,135696800.0,33000.0,113600.0,36800.0,177400.0,12200.0,85000.0,487900.0,18000.0,213000.0,41000.0,9373000.0,5600.0,2419300.0,4610000.0,139000.0,118000.0,3359200.0,3359200.0,1196000.0,1196000.0,1196000.0,132000.0,160600.0,2150500.0,8000.0,7106600.0,102000.0,100000.0,20300.0,257700.0,3700.0,2300.0,15000.0,1104400.0,1104400.0,14000.0,16000.0,11000.0,1600.0,48000.0,100000.0,1600.0,33000.0,85000.0,300.0,6500.0,5900.0,244000.0,4600.0,843000.0,15700.0,15700.0,461000.0,2900.0,31000.0,13300.0,9228800.0,17966900.0,17966900.0,6063100.0,111400.0,111400.0,342400.0,5725900.0,5725900.0,342300.0,12284400.0,12284400.0,12284400.0,66822900.0,2800.0,74000.0,56000.0,18627800.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0,27508450.0]},"kind":"numeric","n":7124,"n_null":5,"n_unique":1509,"null_rate":0.0007018528916339135,"stats":{"iqr":1414600.0,"kurtosis":1051.5454118766831,"max":925129800.0,"mean":4880603.574940301,"median":130300.0,"min":10.0,"n_outliers":1264,"outlier_rate":0.17755302711054924,"q1":20000.0,"q3":1434600.0,"skew":25.484786527825804,"std":20949338.00151076,"zero_rate":0.0}},{"alerts":[],"column":"Frontier","extras":{"singletons":0,"top_values":[["Y",4767],["N",2357]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.9157959662837094,"entropy_ratio":0.9157959662837094,"top_rate":0.6691465468837732,"top_value":"Y"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"35.2% duplicate 
strings"}],"column":"MapAddress","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1500,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3833,0,0,0,0,0,0,0,0,1791],"edges":[0.0,0.325,0.65,0.9750000000000001,1.3,1.625,1.9500000000000002,2.275,2.6,2.9250000000000003,3.25,3.575,3.9000000000000004,4.2250000000000005,4.55,4.875,5.2,5.525,5.8500000000000005,6.175,6.5,6.825,7.15,7.4750000000000005,7.800000000000001,8.125,8.450000000000001,8.775,9.1,9.425,9.75,10.075000000000001,10.4,10.725,11.05,11.375,11.700000000000001,12.025,12.35,12.675,13.0]},"near_unique":false,"sample":["m10375.png","m21769.png","m14244_ni.png","m10824_pu.png","m16828.png","","m17080.png","","m10949_cm.png","m13819_no.png","m19198.png","m17745.png","m18615_ch.png","m00007.png","m19808.png","","","m11988_su.png","","m16620.png","m11478.png","m13922_ag.png","","","m21128.png","m22047.png","m17937.png","m10584_rp.png","","m18274_tu.png","m20032.png","m20236.png","m20235.png","m16501.png","m16278.png","m16944.png","","m17590.png","m17067.png","m17721.png","m00005.png","m18628_ch.png","","m18617.png","","","","m16514.png","m10839_aj.png","m16100_bn.png"],"top_values":[["",1500],["m00328.png",40],["m00007.png",33],["m00077.png",19],["m00040.png",14],["m00005.png",13],["m00079.png",13],["m14256.png",13],["m00081.png",12],["m00068.png",10],["m00273.png",10],["m00034.png",8],["m14322.png",8],["m00305.png",8],["m18084.png",8],["m00033.png",7],["m00028.png",7],["m00009.png",6],["m00042.png",6],["m11359.png",6]],"top_words":[["m00328.png",40],["m00007.png",33],["m00077.png",19],["m00040.png",14],["m00005.png",13],["m00079.png",13],["m14256.png",13],["m00081.png",12],["m00068.png",10],["m00273.png",10],["m00034.png",8],["m14322.png",8],["m00305.png",8],["m18084.png",8],["m00033.png",7],["m00028.png",7],["m00009.png",6],["m00042.png",6],["m11359.png",6],["m16318.png",6],["m00015.png",5],["m00306.png",5],["m00334.png",5],["m16187.png",5],["m16521.png",5]],"vocab_skip
ped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":4616,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.352049410443571,"emoji_rate":0.0,"len_max":13,"len_mean":8.648652442448062,"len_median":10.0,"len_min":0,"len_p95":13.0,"n_duplicates":2508,"n_empty":1500,"one_word_rate":1.0,"readability_flesch_mean":17.622400000000027,"url_rate":0.0,"vocab_size":4615,"word_mean":1.0,"word_median":1.0}},{"alerts":[],"column":"HasJesusFilm","extras":{"singletons":0,"top_values":[["Y",5610],["N",1514]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.7462740906620023,"entropy_ratio":0.7462740906620023,"top_rate":0.787478944413251,"top_value":"Y"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 96.6% of rows"}],"column":"Nomadic","extras":{"singletons":0,"top_values":[["N",6884],["Y",240]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.21256700366888365,"entropy_ratio":0.21256700366888365,"top_rate":0.9663110612015722,"top_value":"N"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.6% null"}],"column":"NomadicTypeDescription","extras":{"singletons":2,"top_values":[["Agro-Pastoralists",184],["Service or Trade",30],["Agro-Pastoralists, Service or Trade",16],["Hunter-Gatherers",8],["Agro-Pastoralists, Hunter-Gatherers",1],["Service or Trade, 
Hunter-Gatherers",1]]},"kind":"categorical","n":7124,"n_null":6884,"n_unique":6,"null_rate":0.9663110612015722,"stats":{"cardinality":6,"entropy":1.1587984381804104,"entropy_ratio":0.4482844288290942,"top_rate":0.7666666666666667,"top_value":"Agro-Pastoralists"}},{"alerts":[],"column":"PhotoCCVersionText","extras":{"singletons":1,"top_values":[["",5688],["CC BY 2.0",387],["CC BY-SA 4.0",246],["CC BY-SA 2.0",193],["CC BY-NC-SA 2.0",151],["CC BY-SA 3.0",143],["CC0 1.0",127],["CC BY-NC 2.0",111],["CC BY 3.0",27],["CC BY-NC-ND 2.0",18],["CC BY 4.0",14],["CC SA 1.0",7],["CC BY-ND 2.0",5],["CC BY 3.0 BR",4],["CC BY-SA 2.5",2],["CC BY-NC-SA 4.0",1]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"cardinality":16,"entropy":1.3227594126157038,"entropy_ratio":0.33068985315392596,"top_rate":0.79842784952274,"top_value":""}},{"alerts":[],"column":"PhotoCCVersionURL","extras":{"singletons":1,"top_values":[["",5688],["https://creativecommons.org/licenses/by/2.0/",387],["https://creativecommons.org/licenses/by-sa/4.0/",246],["https://creativecommons.org/licenses/by-sa/2.0/",193],["https://creativecommons.org/licenses/by-nc-sa/2.0/",151],["https://creativecommons.org/licenses/by-sa/3.0/",143],["https://creativecommons.org/publicdomain/zero/1.0/",127],["https://creativecommons.org/licenses/by-nc/2.0/",111],["https://creativecommons.org/licenses/by/3.0/",27],["https://creativecommons.org/licenses/by-nc-nd/2.0/",18],["https://creativecommons.org/licenses/by/4.0/",14],["https://creativecommons.org/licenses/by-sa/1.0/",7],["https://creativecommons.org/licenses/by-nd/2.0/",5],["https://creativecommons.org/licenses/by/3.0/br/deed.en",4],["https://creativecommons.org/licenses/by-sa/2.5/",2],["https://creativecommons.org/licenses/by-nc-sa/4.0",1]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"cardinality":16,"entropy":1.3227594126157038,"entropy_ratio":0.33068985315392596,"top_rate":0.79842784952274,"top_value":""}},{"ale
rts":[{"code":"long_tail","level":"info","message":"99 singleton categories"}],"column":"MapCredits","extras":{"singletons":99,"top_values":[["People Group data: Omid.  Map geography: UNESCO / GMI.  Map Design: Joshua Project",1995],["",1505],["Location: IMB. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",808],["People Group data: Omid.  Map geography: UNESCO / GMI.  Map Design: Joshua Project.",755],["People Group Location: Omid. Other geography / data: GMI. Map Design: Joshua Project",583],["Bethany World Prayer Center",408],["Joshua Project / Global Mapping International",335],["Bryan Nicholson / cartoMission",100],["Location: SIL / WLMS. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",77],["Anonymous",70],["Location: WLMS. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",47],["NCRP",44],["Location: Web research. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",31],["Asia Harvest-Operation Myanmar",26],["Location: World Jewish Congress, Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",26],["Location: Joshua Project. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",23],["Southeast Asia Link - SEALINK",21],["Location: Ethnologue. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",18],["Location: Asia Harvest. Imagery: GMI, ESRI, Maxar, Earthstar Geographics, ESRI User Community. Design: Joshua Project.",10],["Peoples of the Red Book",8]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":161,"null_rate":0.0,"stats":{"cardinality":161,"entropy":3.318395487912014,"entropy_ratio":0.4526576338382174,"top_rate":0.2800393037619315,"top_value":"People Group data: Omid.  Map geography: UNESCO / GMI.  
Map Design: Joshua Project"}},{"alerts":[{"code":"long_tail","level":"info","message":"19 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 97.1% of rows"}],"column":"MapCreditURL","extras":{"singletons":19,"top_values":[["",6919],["https://www.cartomission.com",100],["https://www.asiaharvest.org",28],["https://www.worldjewishcongress.org/",26],["https://www.eki.ee/books/redbook/introduction.shtml",8],["https://commons.wikimedia.org/wiki/File:Maeneo_penye_wasemaji_wa_Kiswahili.png",7],["https://www.npolar.no/ansipra/english/Indexpages/Map_index.html",5],["https://www.face-music.ch/bi_bid/trad_costumes_en.html",3],["https://thekurds.net/",3],["https://www.cartpioneers.org/products/Peoples-of-Yemen-Prayer-Guide.html",2],["http://lingvarium.org/",2],["https://www.westmelanesia.com/",2],["https://www.lib.utexas.edu/maps/africa/libya_ethnic_1974.jpg",1],["https://commons.wikimedia.org/wiki/File:Libya_ethnic.svg",1],["https://www.ssb.no/en/statbank/table/09817/tableViewLayout1/",1],["https://commons.wikimedia.org/wiki/File:Alawites_in_the_Levant.jpg",1],["https://zolimacitymag.com/keeping-hakka-culture-alive-the-story-of-hong-kongs-mountain-pioneers/",1],["https://www.cia.gov/the-world-factbook/countries/china/map/",1],["https://commons.wikimedia.org/wiki/File:Albanians_in_Kosovo_2011_census.GIF",1],["https://www.refworld.org/docid/4a8414f5c.html",1]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":31,"null_rate":0.0,"stats":{"cardinality":31,"entropy":0.26995629097399637,"entropy_ratio":0.05449043075019274,"top_rate":0.9712240314430095,"top_value":""}},{"alerts":[],"column":"MapCopyright","extras":{"singletons":0,"top_values":[["N",5197],["",1885],["Y",42]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":3,"null_rate":0.0,"stats":{"cardinality":3,"entropy":0.883127355260391,"entropy_ratio":0.5571913246266514,"top_rate":0.7295058955642897,"top_value":"N"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 
99.9% of rows"}],"column":"MapCCVersionText","extras":{"singletons":2,"top_values":[["",7114],["CC BY-SA 3.0",8],["CC0 1.0",1],["CC BY 3.0",1]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":4,"null_rate":0.0,"stats":{"cardinality":4,"entropy":0.016620092375341105,"entropy_ratio":0.008310046187670552,"top_rate":0.9985962942167321,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 99.9% of rows"}],"column":"MapCCVersionURL","extras":{"singletons":2,"top_values":[["",7114],["https://creativecommons.org/licenses/by-sa/3.0/",8],["https://creativecommons.org/publicdomain/zero/1.0/",1],["https://creativecommons.org/licenses/by/3.0/",1]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":4,"null_rate":0.0,"stats":{"cardinality":4,"entropy":0.016620092375341105,"entropy_ratio":0.008310046187670552,"top_rate":0.9985962942167321,"top_value":""}},{"alerts":[],"column":"JF","extras":{"singletons":0,"top_values":[["Y",5610],["N",1514]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.7462740906620023,"entropy_ratio":0.7462740906620023,"top_rate":0.787478944413251,"top_value":"Y"}},{"alerts":[],"column":"AudioRecordings","extras":{"singletons":0,"top_values":[["Y",6188],["N",936]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.5612294270509872,"entropy_ratio":0.5612294270509872,"top_rate":0.8686131386861314,"top_value":"Y"}},{"alerts":[],"column":"Window1040","extras":{"singletons":0,"top_values":[["Y",5910],["N",1214]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.6586415570774855,"entropy_ratio":0.6586415570774855,"top_rate":0.8295901179112858,"top_value":"Y"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"url_heavy","level":"info","message":"78.9% rows contain a 
URL"},{"code":"duplicates","level":"warn","message":"35.2% duplicate strings"}],"column":"PeopleGroupMapURL","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1500,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3833,1791],"edges":[0.0,1.65,3.3,4.949999999999999,6.6,8.25,9.899999999999999,11.549999999999999,13.2,14.85,16.5,18.15,19.799999999999997,21.45,23.099999999999998,24.75,26.4,28.049999999999997,29.7,31.349999999999998,33.0,34.65,36.3,37.949999999999996,39.599999999999994,41.25,42.9,44.55,46.199999999999996,47.849999999999994,49.5,51.15,52.8,54.449999999999996,56.099999999999994,57.75,59.4,61.05,62.699999999999996,64.35,66.0]},"near_unique":false,"sample":["https://joshuaproject.net/assets/media/profiles/maps/m10375.png","https://joshuaproject.net/assets/media/profiles/maps/m21769.png","https://joshuaproject.net/assets/media/profiles/maps/m14244_ni.png","https://joshuaproject.net/assets/media/profiles/maps/m10824_pu.png","https://joshuaproject.net/assets/media/profiles/maps/m16828.png","","https://joshuaproject.net/assets/media/profiles/maps/m17080.png","","https://joshuaproject.net/assets/media/profiles/maps/m10949_cm.png","https://joshuaproject.net/assets/media/profiles/maps/m13819_no.png","https://joshuaproject.net/assets/media/profiles/maps/m19198.png","https://joshuaproject.net/assets/media/profiles/maps/m17745.png","https://joshuaproject.net/assets/media/profiles/maps/m18615_ch.png","https://joshuaproject.net/assets/media/profiles/maps/m00007.png","https://joshuaproject.net/assets/media/profiles/maps/m19808.png","","","https://joshuaproject.net/assets/media/profiles/maps/m11988_su.png","","https://joshuaproject.net/assets/media/profiles/maps/m16620.png","https://joshuaproject.net/assets/media/profiles/maps/m11478.png","https://joshuaproject.net/assets/media/profiles/maps/m13922_ag.png","","","https://joshuaproject.net/assets/media/profiles/maps/m21128.png","https://joshuaproject.net/assets/
media/profiles/maps/m22047.png","https://joshuaproject.net/assets/media/profiles/maps/m17937.png","https://joshuaproject.net/assets/media/profiles/maps/m10584_rp.png","","https://joshuaproject.net/assets/media/profiles/maps/m18274_tu.png","https://joshuaproject.net/assets/media/profiles/maps/m20032.png","https://joshuaproject.net/assets/media/profiles/maps/m20236.png","https://joshuaproject.net/assets/media/profiles/maps/m20235.png","https://joshuaproject.net/assets/media/profiles/maps/m16501.png","https://joshuaproject.net/assets/media/profiles/maps/m16278.png","https://joshuaproject.net/assets/media/profiles/maps/m16944.png","","https://joshuaproject.net/assets/media/profiles/maps/m17590.png","https://joshuaproject.net/assets/media/profiles/maps/m17067.png","https://joshuaproject.net/assets/media/profiles/maps/m17721.png","https://joshuaproject.net/assets/media/profiles/maps/m00005.png","https://joshuaproject.net/assets/media/profiles/maps/m18628_ch.png","","https://joshuaproject.net/assets/media/profiles/maps/m18617.png","","","","https://joshuaproject.net/assets/media/profiles/maps/m16514.png","https://joshuaproject.net/assets/media/profiles/maps/m10839_aj.png","https://joshuaproject.net/assets/media/profiles/maps/m16100_bn.png"],"top_values":[["",1500],["https://joshuaproject.net/assets/media/profiles/maps/m00328.png",40],["https://joshuaproject.net/assets/media/profiles/maps/m00007.png",33],["https://joshuaproject.net/assets/media/profiles/maps/m00077.png",19],["https://joshuaproject.net/assets/media/profiles/maps/m00040.png",14],["https://joshuaproject.net/assets/media/profiles/maps/m00005.png",13],["https://joshuaproject.net/assets/media/profiles/maps/m00079.png",13],["https://joshuaproject.net/assets/media/profiles/maps/m14256.png",13],["https://joshuaproject.net/assets/media/profiles/maps/m00081.png",12],["https://joshuaproject.net/assets/media/profiles/maps/m00068.png",10],["https://joshuaproject.net/assets/media/profiles/maps/m00273.png",10],["https://jo
shuaproject.net/assets/media/profiles/maps/m00034.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m14322.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m00305.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m18084.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m00033.png",7],["https://joshuaproject.net/assets/media/profiles/maps/m00028.png",7],["https://joshuaproject.net/assets/media/profiles/maps/m00009.png",6],["https://joshuaproject.net/assets/media/profiles/maps/m00042.png",6],["https://joshuaproject.net/assets/media/profiles/maps/m11359.png",6]],"top_words":[["https://joshuaproject.net/assets/media/profiles/maps/m00328.png",40],["https://joshuaproject.net/assets/media/profiles/maps/m00007.png",33],["https://joshuaproject.net/assets/media/profiles/maps/m00077.png",19],["https://joshuaproject.net/assets/media/profiles/maps/m00040.png",14],["https://joshuaproject.net/assets/media/profiles/maps/m00005.png",13],["https://joshuaproject.net/assets/media/profiles/maps/m00079.png",13],["https://joshuaproject.net/assets/media/profiles/maps/m14256.png",13],["https://joshuaproject.net/assets/media/profiles/maps/m00081.png",12],["https://joshuaproject.net/assets/media/profiles/maps/m00068.png",10],["https://joshuaproject.net/assets/media/profiles/maps/m00273.png",10],["https://joshuaproject.net/assets/media/profiles/maps/m00034.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m14322.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m00305.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m18084.png",8],["https://joshuaproject.net/assets/media/profiles/maps/m00033.png",7],["https://joshuaproject.net/assets/media/profiles/maps/m00028.png",7],["https://joshuaproject.net/assets/media/profiles/maps/m00009.png",6],["https://joshuaproject.net/assets/media/profiles/maps/m00042.png",6],["https://joshuaproject.net/assets/media/profiles/maps/m11359.png",6],["https://joshuaproject.net/
assets/media/profiles/maps/m16318.png",6],["https://joshuaproject.net/assets/media/profiles/maps/m00015.png",5],["https://joshuaproject.net/assets/media/profiles/maps/m00306.png",5],["https://joshuaproject.net/assets/media/profiles/maps/m00334.png",5],["https://joshuaproject.net/assets/media/profiles/maps/m16187.png",5],["https://joshuaproject.net/assets/media/profiles/maps/m16521.png",5]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":4616,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.352049410443571,"emoji_rate":0.0,"len_max":66,"len_mean":50.489191465468835,"len_median":63.0,"len_min":0,"len_p95":66.0,"n_duplicates":2508,"n_empty":1500,"one_word_rate":1.0,"readability_flesch_mean":-568.6555999999999,"url_rate":0.7894441325098259,"vocab_size":4615,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"url_heavy","level":"info","message":"72.3% rows contain a URL"},{"code":"duplicates","level":"warn","message":"39.2% duplicate 
strings"}],"column":"PeopleGroupMapExpandedURL","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1975,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3579,1570],"edges":[0.0,1.65,3.3,4.949999999999999,6.6,8.25,9.899999999999999,11.549999999999999,13.2,14.85,16.5,18.15,19.799999999999997,21.45,23.099999999999998,24.75,26.4,28.049999999999997,29.7,31.349999999999998,33.0,34.65,36.3,37.949999999999996,39.599999999999994,41.25,42.9,44.55,46.199999999999996,47.849999999999994,49.5,51.15,52.8,54.449999999999996,56.099999999999994,57.75,59.4,61.05,62.699999999999996,64.35,66.0]},"near_unique":false,"sample":["https://joshuaproject.net/assets/media/profiles/maps/m10375.pdf","https://joshuaproject.net/assets/media/profiles/maps/m21769.pdf","https://joshuaproject.net/assets/media/profiles/maps/m14244_ni.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m16828.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m17080.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m10949_cm.pdf","https://joshuaproject.net/assets/media/profiles/maps/m13819_no.pdf","https://joshuaproject.net/assets/media/profiles/maps/m19198.pdf","https://joshuaproject.net/assets/media/profiles/maps/m17745.pdf","https://joshuaproject.net/assets/media/profiles/maps/m18615_ch.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m19808.pdf","","","https://joshuaproject.net/assets/media/profiles/maps/m11988_su.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m16620.pdf","https://joshuaproject.net/assets/media/profiles/maps/m11478.pdf","https://joshuaproject.net/assets/media/profiles/maps/m13922_ag.pdf","","","https://joshuaproject.net/assets/media/profiles/maps/m21128.pdf","https://joshuaproject.net/assets/media/profiles/maps/m22047.pdf","https://joshuaproject.net/assets/media/profiles/maps/m17937.pdf","https://joshuaproject.net/assets/media/profiles/maps/m10584_rp.pdf","","https://joshuaproje
ct.net/assets/media/profiles/maps/m18274_tu.pdf","https://joshuaproject.net/assets/media/profiles/maps/m20032.pdf","https://joshuaproject.net/assets/media/profiles/maps/m20236.pdf","https://joshuaproject.net/assets/media/profiles/maps/m20235.pdf","https://joshuaproject.net/assets/media/profiles/maps/m16501.pdf","https://joshuaproject.net/assets/media/profiles/maps/m16278.pdf","https://joshuaproject.net/assets/media/profiles/maps/m16944.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m17590.pdf","https://joshuaproject.net/assets/media/profiles/maps/m17067.pdf","https://joshuaproject.net/assets/media/profiles/maps/m17721.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m18628_ch.pdf","","https://joshuaproject.net/assets/media/profiles/maps/m18617.pdf","","","","https://joshuaproject.net/assets/media/profiles/maps/m16514.pdf","https://joshuaproject.net/assets/media/profiles/maps/m10839_aj.pdf","https://joshuaproject.net/assets/media/profiles/maps/m16100_bn.pdf"],"top_values":[["",1975],["https://joshuaproject.net/assets/media/profiles/maps/m00328.pdf",40],["https://joshuaproject.net/assets/media/profiles/maps/m14256.pdf",13],["https://joshuaproject.net/assets/media/profiles/maps/m14322.pdf",8],["https://joshuaproject.net/assets/media/profiles/maps/m00305.pdf",8],["https://joshuaproject.net/assets/media/profiles/maps/m18084.pdf",8],["https://joshuaproject.net/assets/media/profiles/maps/m11359.pdf",6],["https://joshuaproject.net/assets/media/profiles/maps/m16318.pdf",6],["https://joshuaproject.net/assets/media/profiles/maps/m00306.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m00334.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m16187.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m16521.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m16709.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m18045.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m18150.p
df",5],["https://joshuaproject.net/assets/media/profiles/maps/m19655.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m00333.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16221.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16297.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16333.pdf",4]],"top_words":[["https://joshuaproject.net/assets/media/profiles/maps/m00328.pdf",40],["https://joshuaproject.net/assets/media/profiles/maps/m14256.pdf",13],["https://joshuaproject.net/assets/media/profiles/maps/m14322.pdf",8],["https://joshuaproject.net/assets/media/profiles/maps/m00305.pdf",8],["https://joshuaproject.net/assets/media/profiles/maps/m18084.pdf",8],["https://joshuaproject.net/assets/media/profiles/maps/m11359.pdf",6],["https://joshuaproject.net/assets/media/profiles/maps/m16318.pdf",6],["https://joshuaproject.net/assets/media/profiles/maps/m00306.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m00334.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m16187.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m16521.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m16709.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m18045.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m18150.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m19655.pdf",5],["https://joshuaproject.net/assets/media/profiles/maps/m00333.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16221.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16297.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16333.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m16561.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m17316.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m17328.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m17379.pdf",4],["https://joshuap
roject.net/assets/media/profiles/maps/m17513.pdf",4],["https://joshuaproject.net/assets/media/profiles/maps/m17519.pdf",4]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":4331,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.3920550252667041,"emoji_rate":0.0,"len_max":66,"len_mean":46.19553621560921,"len_median":63.0,"len_min":0,"len_p95":66.0,"n_duplicates":2793,"n_empty":1975,"one_word_rate":1.0,"readability_flesch_mean":-468.90979999999996,"url_rate":0.7227681078046042,"vocab_size":4330,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"url_heavy","level":"info","message":"100.0% rows contain a 
URL"}],"column":"PeopleGroupURL","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[47.5,47.525,47.55,47.575,47.6,47.625,47.65,47.675,47.7,47.725,47.75,47.775,47.8,47.825,47.85,47.875,47.9,47.925,47.95,47.975,48.0,48.025,48.05,48.075,48.1,48.125,48.15,48.175,48.2,48.225,48.25,48.275,48.3,48.325,48.35,48.375,48.4,48.425,48.45,48.475,48.5]},"near_unique":true,"sample":["https://joshuaproject.net/people_groups/10375/CE","https://joshuaproject.net/people_groups/21769/IN","https://joshuaproject.net/people_groups/14244/NI","https://joshuaproject.net/people_groups/10824/PU","https://joshuaproject.net/people_groups/16828/IN","https://joshuaproject.net/people_groups/18274/LY","https://joshuaproject.net/people_groups/17080/NP","https://joshuaproject.net/people_groups/22370/NI","https://joshuaproject.net/people_groups/10949/CM","https://joshuaproject.net/people_groups/13819/NO","https://joshuaproject.net/people_groups/19198/BT","https://joshuaproject.net/people_groups/17745/IN","https://joshuaproject.net/people_groups/18615/CH","https://joshuaproject.net/people_groups/10376/MU","https://joshuaproject.net/people_groups/19808/CH","https://joshuaproject.net/people_groups/21571/BR","https://joshuaproject.net/people_groups/10161/US","https://joshuaproject.net/people_groups/11988/SU","https://joshuaproject.net/people_groups/19007/KG","https://joshuaproject.net/people_groups/16620/IN","https://joshuaproject.net/people_groups/11478/BT","https://joshuaproject.net/people_groups/13922/AG","https://joshuaproject.net/people_groups/12347/UK","https://joshuaproject.net/people_groups/11317/FR","https://joshuaproject.net/people_groups/21128/IN","https://joshuaproject.net/people_groups/22047/PK","https://joshuaproject.net/people_groups/17937/IN","https://joshuaproject.net/people_groups/10584/RP","https://joshuaproject.net/people_groups/12054/CA","https://joshuaproje
ct.net/people_groups/18274/TU","https://joshuaproject.net/people_groups/20032/PK","https://joshuaproject.net/people_groups/20236/IN","https://joshuaproject.net/people_groups/20235/PK","https://joshuaproject.net/people_groups/16501/IN","https://joshuaproject.net/people_groups/16278/IN","https://joshuaproject.net/people_groups/16944/BG","https://joshuaproject.net/people_groups/20610/CH","https://joshuaproject.net/people_groups/17590/PK","https://joshuaproject.net/people_groups/17067/IN","https://joshuaproject.net/people_groups/17721/IN","https://joshuaproject.net/people_groups/10391/SU","https://joshuaproject.net/people_groups/18628/CH","https://joshuaproject.net/people_groups/18577/CH","https://joshuaproject.net/people_groups/18617/CH","https://joshuaproject.net/people_groups/14039/MG","https://joshuaproject.net/people_groups/20631/GG","https://joshuaproject.net/people_groups/15382/GM","https://joshuaproject.net/people_groups/16514/NP","https://joshuaproject.net/people_groups/10839/AJ","https://joshuaproject.net/people_groups/16100/BN"],"top_values":[],"top_words":[["https://joshuaproject.net/people_groups/10208/ng",1],["https://joshuaproject.net/people_groups/10301/su",1],["https://joshuaproject.net/people_groups/10375/tz",1],["https://joshuaproject.net/people_groups/10375/up",1],["https://joshuaproject.net/people_groups/10376/ae",1],["https://joshuaproject.net/people_groups/10376/ca",1],["https://joshuaproject.net/people_groups/10375/as",1],["https://joshuaproject.net/people_groups/10375/bu",1],["https://joshuaproject.net/people_groups/10375/ce",1],["https://joshuaproject.net/people_groups/10375/cg",1],["https://joshuaproject.net/people_groups/10375/gb",1],["https://joshuaproject.net/people_groups/10375/hu",1],["https://joshuaproject.net/people_groups/10375/id",1],["https://joshuaproject.net/people_groups/10375/ke",1],["https://joshuaproject.net/people_groups/10375/mk",1],["https://joshuaproject.net/people_groups/10375/my",1],["https://joshuaproject.net/people_grou
ps/10375/pk",1],["https://joshuaproject.net/people_groups/10375/rp",1],["https://joshuaproject.net/people_groups/10375/sl",1],["https://joshuaproject.net/people_groups/10375/so",1],["https://joshuaproject.net/people_groups/10376/eg",1],["https://joshuaproject.net/people_groups/10376/ir",1],["https://joshuaproject.net/people_groups/10376/iz",1],["https://joshuaproject.net/people_groups/10376/ku",1],["https://joshuaproject.net/people_groups/10376/mu",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":7124,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":48,"len_mean":48.0,"len_median":48.0,"len_min":48,"len_p95":48.0,"n_duplicates":0,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":-479.86299999999983,"url_rate":1.0,"vocab_size":7124,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"url_heavy","level":"info","message":"72.3% rows contain a URL"},{"code":"duplicates","level":"warn","message":"59.6% duplicate 
strings"}],"column":"PeopleGroupPhotoURL","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[1971,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5092,61],"edges":[0.0,1.7,3.4,5.1,6.8,8.5,10.2,11.9,13.6,15.299999999999999,17.0,18.7,20.4,22.099999999999998,23.8,25.5,27.2,28.9,30.599999999999998,32.3,34.0,35.699999999999996,37.4,39.1,40.8,42.5,44.199999999999996,45.9,47.6,49.3,51.0,52.699999999999996,54.4,56.1,57.8,59.5,61.199999999999996,62.9,64.6,66.3,68.0]},"near_unique":false,"sample":["https://joshuaproject.net/assets/media/profiles/photos/p10375.jpg","https://joshuaproject.net/assets/media/profiles/photos/p21769.jpg","https://joshuaproject.net/assets/media/profiles/photos/p14244.jpg","https://joshuaproject.net/assets/media/profiles/photos/p10824.jpg","https://joshuaproject.net/assets/media/profiles/photos/p16828.jpg","https://joshuaproject.net/assets/media/profiles/photos/p18274.jpg","https://joshuaproject.net/assets/media/profiles/photos/p17080.jpg","","https://joshuaproject.net/assets/media/profiles/photos/p10949.jpg","https://joshuaproject.net/assets/media/profiles/photos/p13819.jpg","https://joshuaproject.net/assets/media/profiles/photos/p19198.jpg","https://joshuaproject.net/assets/media/profiles/photos/p17745.jpg","https://joshuaproject.net/assets/media/profiles/photos/p18615.jpg","https://joshuaproject.net/assets/media/profiles/photos/p10376.jpg","https://joshuaproject.net/assets/media/profiles/photos/p19808.jpg","https://joshuaproject.net/assets/media/profiles/photos/p21571.jpg","https://joshuaproject.net/assets/media/profiles/photos/p10161.jpg","","https://joshuaproject.net/assets/media/profiles/photos/p19007.jpg","","https://joshuaproject.net/assets/media/profiles/photos/p11478.jpg","https://joshuaproject.net/assets/media/profiles/photos/p13922.jpg","https://joshuaproject.net/assets/media/profiles/photos/p12347.jpg","https://joshuaproject.net/assets/media/profiles/photos/p11317.jpg","","",
"","https://joshuaproject.net/assets/media/profiles/photos/p10584.jpg","https://joshuaproject.net/assets/media/profiles/photos/p12054.jpg","https://joshuaproject.net/assets/media/profiles/photos/p18274.jpg","","","https://joshuaproject.net/assets/media/profiles/photos/p20235.jpg","","","https://joshuaproject.net/assets/media/profiles/photos/p16944.jpg","","","https://joshuaproject.net/assets/media/profiles/photos/p17067.jpg","https://joshuaproject.net/assets/media/profiles/photos/p17721.jpg","","https://joshuaproject.net/assets/media/profiles/photos/p18628.jpg","https://joshuaproject.net/assets/media/profiles/photos/p18577.jpg","https://joshuaproject.net/assets/media/profiles/photos/p18617.jpg","https://joshuaproject.net/assets/media/profiles/photos/p14039.jpg","https://joshuaproject.net/assets/media/profiles/photos/p20631.jpg","https://joshuaproject.net/assets/media/profiles/photos/p15382.jpg","https://joshuaproject.net/assets/media/profiles/photos/p16514.jpg","https://joshuaproject.net/assets/media/profiles/photos/p10839.jpg","https://joshuaproject.net/assets/media/profiles/photos/p16100.jpg"],"top_values":[["",1971],["https://joshuaproject.net/assets/media/profiles/photos/p19007.jpg",90],["https://joshuaproject.net/assets/media/profiles/photos/p18274.jpg",38],["https://joshuaproject.net/assets/media/profiles/photos/p14371.jpg",36],["https://joshuaproject.net/assets/media/profiles/photos/p12322.jpg",34],["https://joshuaproject.net/assets/media/profiles/photos/p19211.jpg",34],["https://joshuaproject.net/assets/media/profiles/photos/p12877.jpg",28],["https://joshuaproject.net/assets/media/profiles/photos/p14983.jpg",27],["https://joshuaproject.net/assets/media/profiles/photos/p11277.jpg",27],["https://joshuaproject.net/assets/media/profiles/photos/p13819.jpg",25],["https://joshuaproject.net/assets/media/profiles/photos/p15727.jpg",24],["https://joshuaproject.net/assets/media/profiles/photos/p15104.jpg",23],["https://joshuaproject.net/assets/media/profiles/photos/p13
317.jpg",23],["https://joshuaproject.net/assets/media/profiles/photos/p13437.jpg",22],["https://joshuaproject.net/assets/media/profiles/photos/p19314.jpg",21],["https://joshuaproject.net/assets/media/profiles/photos/p10953.jpg",20],["https://joshuaproject.net/assets/media/profiles/photos/p11982.jpg",20],["https://joshuaproject.net/assets/media/profiles/photos/p14483.jpg",19],["https://joshuaproject.net/assets/media/profiles/photos/p10379.jpg",18],["https://joshuaproject.net/assets/media/profiles/photos/p12247.jpg",18]],"top_words":[["https://joshuaproject.net/assets/media/profiles/photos/p19007.jpg",90],["https://joshuaproject.net/assets/media/profiles/photos/p18274.jpg",38],["https://joshuaproject.net/assets/media/profiles/photos/p14371.jpg",36],["https://joshuaproject.net/assets/media/profiles/photos/p12322.jpg",34],["https://joshuaproject.net/assets/media/profiles/photos/p19211.jpg",34],["https://joshuaproject.net/assets/media/profiles/photos/p12877.jpg",28],["https://joshuaproject.net/assets/media/profiles/photos/p14983.jpg",27],["https://joshuaproject.net/assets/media/profiles/photos/p11277.jpg",27],["https://joshuaproject.net/assets/media/profiles/photos/p13819.jpg",25],["https://joshuaproject.net/assets/media/profiles/photos/p15727.jpg",24],["https://joshuaproject.net/assets/media/profiles/photos/p15104.jpg",23],["https://joshuaproject.net/assets/media/profiles/photos/p13317.jpg",23],["https://joshuaproject.net/assets/media/profiles/photos/p13437.jpg",22],["https://joshuaproject.net/assets/media/profiles/photos/p19314.jpg",21],["https://joshuaproject.net/assets/media/profiles/photos/p10953.jpg",20],["https://joshuaproject.net/assets/media/profiles/photos/p11982.jpg",20],["https://joshuaproject.net/assets/media/profiles/photos/p14483.jpg",19],["https://joshuaproject.net/assets/media/profiles/photos/p10379.jpg",18],["https://joshuaproject.net/assets/media/profiles/photos/p12247.jpg",18],["https://joshuaproject.net/assets/media/profiles/photos/p15145.jpg",18],["
https://joshuaproject.net/assets/media/profiles/photos/p10790.jpg",17],["https://joshuaproject.net/assets/media/profiles/photos/p11029.jpg",17],["https://joshuaproject.net/assets/media/profiles/photos/p10375.jpg",16],["https://joshuaproject.net/assets/media/profiles/photos/p15198.jpg",16],["https://joshuaproject.net/assets/media/profiles/photos/p14256.jpg",16]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,7124,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":7124,"n_null":0,"n_unique":2880,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.5957327344188658,"emoji_rate":0.0,"len_max":68,"len_mean":47.042111173498036,"len_median":65.0,"len_min":0,"len_p95":65.0,"n_duplicates":4244,"n_empty":1971,"one_word_rate":1.0,"readability_flesch_mean":-604.2824999999998,"url_rate":0.7233295901179113,"vocab_size":2879,"word_mean":1.0,"word_median":1.0}},{"alerts":[],"column":"CountryURL","extras":{"singletons":35,"top_values":[["https://joshuaproject.net/countries/IN",2032],["https://joshuaproject.net/countries/PK",767],["https://joshuaproject.net/countries/CH",442],["https://joshuaproject.net/countries/BG",256],["https://joshuaproject.net/countries/ID",234],["https://joshuaproject.net/countries/NP",184],["https://joshuaproject.net/countries/SU",168],["https://joshuaproject.net/countries/LA",142],["https://joshuaproject.net/countries/RS",115],["https://joshuaproject.net/countries/US",90],["https://joshuaproject.net/countries/IR",85],["https://joshuaproject.net/countries/CD",81],["https:
//joshuaproject.net/countries/MY",78],["https://joshuaproject.net/countries/TH",73],["https://joshuaproject.net/countries/VM",69],["https://joshuaproject.net/countries/TU",61],["https://joshuaproject.net/countries/BM",59],["https://joshuaproject.net/countries/AF",58],["https://joshuaproject.net/countries/CE",55],["https://joshuaproject.net/countries/CA",52]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":202,"null_rate":0.0,"stats":{"cardinality":202,"entropy":5.058444860597964,"entropy_ratio":0.660525616456381,"top_rate":0.2852330151600225,"top_value":"https://joshuaproject.net/countries/IN"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"JPScaleText","extras":{"singletons":0,"top_values":[["Unreached",7124]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Unreached"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"JPScaleImageURL","extras":{"singletons":0,"top_values":[["https://joshuaproject.net/assets/img/gauge/gauge-1.png",7124]]},"kind":"categorical","n":7124,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"https://joshuaproject.net/assets/img/gauge/gauge-1.png"}},{"alerts":[{"code":"one_word","level":"warn","message":"44.5% rows are a single word"},{"code":"duplicates","level":"warn","message":"48.3% duplicate 
strings"}],"column":"Summary","extras":{"language_counts":{"__engine":"fasttext:1,092","en":1092},"language_sample_size":5000,"length_histogram":{"counts":[3167,1,1,7,16,21,40,60,76,110,144,173,162,198,208,206,243,234,207,224,253,244,196,251,143,165,85,84,60,29,18,9,10,21,50,3,2,1,0,2],"edges":[0.0,30.3,60.6,90.9,121.2,151.5,181.8,212.1,242.4,272.7,303.0,333.3,363.6,393.90000000000003,424.2,454.5,484.8,515.1,545.4,575.7,606.0,636.3000000000001,666.6,696.9,727.2,757.5,787.8000000000001,818.1,848.4,878.7,909.0,939.3000000000001,969.6,999.9,1030.2,1060.5,1090.8,1121.1000000000001,1151.4,1181.7,1212.0]},"near_unique":false,"sample":["","The traditional work of the Mansoori Muslim has been making fabric from cotton. With the development of modern fabric factories, this profession has steeply declined. Many Mansoori are now working in agriculture, in business and in the professions. With the help of the Indian educational system many of the Mansoori community have risen to becoming successful businessmen, accountants, administrators and engineers. They are endogamous, meaning they prefer marriages to occur within their people group. They often marry their cousins. Families arrange marriages. They practice monogamy, marriage between one man and one woman. Divorce is allowed if approved by the community council.","Pa'a boys are initiated into manhood between the ages of nine and eleven. Afterwards, they are taken to a shrine in the forest to be circumcised by the priest. They are taken to spend the night in the priest's house. The dodo, a masked image that represents a family ancestor, comes to scare them during the night to test their bravery. Afterward, they dance to celebrate the boys' entry into manhood. The parents arranged Pa'a marriages. Once the young man is chosen as the groom, he has the duty of helping the girl's family with farm work. He is also required to pay a bride price. There is no official wedding ceremony. 
Instead, after he completes a year of farm work, the man may take his wife home.","Like most of the people in West Africa, the Biafada are farmers and raise livestock. The Biafada language does not yet have any scripture at all. The people are open to hearing God's Word, yet there are many obstacles to overcome. This language group lives within the enemy's stronghold, with a strong adherence to the dominant religion of this area mixed with spirit worship. Persecution for new believers is very intense. Ten new believers were denied food and shelter, and eventually renounced their faith. Significant challenges should be expected.","The Ghosi name comes from the Sanskrit word ghush, which means \u201cto shout.\u201d The reason for this is that the Ghosi are herdsmen who are noted for shouting as they herd their cattle. The raising of cattle for their milk has been the traditional work of the Ghosi for centuries, and this continues today. They can be found in several north Indian states, most notably Uttar Pradesh, Rajasthan and West Bengal. They speak Hindi and read and write in Devanagari. They still work mainly in agriculture, especially in animal husbandry. When the father dies, property goes to the sons; except that women can keep their ornaments. The Ghosi are endogamous, meaning they prefer marriage within their group. They allow for divorce and remarriage. They have a council to settle disputes called the Jati Biradari Sabha.","","The Kandu live in India, Nepal and Bangladesh. There are no known Christian churches among them. Very few, if any, Kandu believers live in Nepal. Indeed, there are few Christians who live anywhere near them.","","The Fulani are grouped according to location, occupation and dialect. Some of the Fulani travel with their herds, others are settled, and some mix herding with farming. 
Since all Fulani speak a Fulfulde dialect, this suggests that they adopted the language of the people they once conquered and continue to dominate, the Hausa of northern Nigeria. The Nigerian Fulani speak Nigerian Fulfulde. They are widely regarded as troublesome by large cattle ranchers and farmers who resent having \"visitations\" by the cattle from nomadic people, and sometimes violent encounters.","Most of the Moroccan Arabs in Europe are centered around urban centers and often have to work in low paying jobs. Many of their traditions are being lost. In Norway, many of the differences have made some elements of their lives difficult.","Walang people have been traders in past times. When modern roads and transportation killed trade through the Walang area, many people were left in turmoil because they had completely relied on trade as their source of income. There were few crops planted in the Walang villages and few kept animals. They are still struggling with an economic transition.","Imagine going to the same person for both a haircut and a tooth extraction! The Nai are a working caste known for barbering and other grooming skills, but they also practice minor medical procedures. The Nai women work in jobs related to marriage celebrations, such as matchmaking and henna application. They also serve as midwives. Many children leave school after a few years to help their parents earn a living. These are their traditional occupations; however, some Nai are beginning to enter professional and modern trades. Hindi is the primary language of the Nai, but they reside throughout India, so they also speak the regional languages of their respective areas. They worship and serve the gods of the Hindu pantheon with additional influence from folk religion.","","Gulf Arabic is the dialect of Arabic spoken mainly in the eastern half of Saudi Arabia and the nearby smaller countries such as Bahrain, Qatar and the UAE. 
It is also spoken by some in Yemen and Oman, two countries that border Saudi Arabia. Most Omanis speak the Omani dialect of Arabic, though some speak Gulf Arabic. Oman is a rural and under-populated nation on the Arabian Peninsula. Their economy has grown considerably, partly because of the discovery of oil deposits.","","","","","","","Most of the Dakpa are farmers. Their principal crops include corn, barley, and beets. They work long hours in the fields in order to produce enough to feed their families. Other important activities include herding yaks and sheep. Since only about 3% of the land in Bhutan is available for farming, the fields are often built in terraces up the mountain sides. The most distinctive part of the Dakpa outfit is the unique felt hat. The hats are flat felt discs made from yak hair. Each hat has five tail-like \"spouts\" that allow water to drain and the head to stay dry. The Dakpa are virtually 100% Buddhist, following the \"Red Hat\" sect of Tibetan Buddhism. In addition, traditional Tibetan shamanism is practiced by some. The Dakpa remain isolated and resistant to the Gospel.","The Arab conquests of the seventh century brought about a rapid expansion of the Bedouin tribes. At that time, thousands left the Middle East and began spreading across North Africa, including Algeria, where the Nail Bedouins now live. They have adapted well to the nomadic or semi-nomadic way of life in the desert. Apart from tribal affiliations, there is little to distinguish one group of Bedouin from another.","English speaking Jewish parents in the UK encourage their children to pursue graduate educations. Jews often find their employment in medicine, law, higher education, science, and finance. Jewish scientists win the Nobel Prize many times above their percentage of the general population. One of the changes today for Judaism is that many Jews marry outside the faith resulting in children of mixed heritage. 
Conservative rabbis will only marry a mixed couple if the non-Jewish person is willing to convert to Judaism.","What happens when an entire people group gets a reputation for committing acts of terrorism? The Chechens in both Russia and France have been labeled terrorists. In Russia, where separatists have waged an ongoing war against the Russian government, Chechens are infamous for their acts of terrorism that often victimize innocent people.\r\n\r\nThere have been two major wars between the Russian military and the Chechens since 1990, and many Chechens have left for safer lands such as France. The Russian military demolished Grozny, the capital of Chechnya, and at one time Chechen terrorists attacked people in a Russian theater.\r\n\r\nIn the early 200s, some Chechens began to flee to France. They are often suspected of being terrorists in that country that has suffered from a number of terrorist attacks.","","","The Ramdasias are a Chamar subgroup that has the interesting distinction of being Hindu, Muslim or Sikh. The Chamar are leather workers by tradition; the word Chamar means skin worker. They are a classed as low status because of their involvement with working with dead animals. The Hindu Randasias live in the western states of India from Himachal Pradesh in the north to Gujarat in the south. Though most Chamar groups are still leather workers or weavers, most of the Ramdasias now work in agriculture or as weavers. Widows are allowed to marry but within their caste under certain conditions. ","The Bajau Kagayan are seafaring people (known as \"Sea Gypsies\") and fish in the Sulu Sea by the Philippines and Sulawesi, Indonesia. They are non-aggressive people who usually retreat from trouble. They live on their boats or on the coast in houses that are built over the sea on stilts. Their livelihood comes from the sea through fishing. The Bajau Kagayan are Sunni Muslims.","There is much speculation concerning the historical roots of the Hakka. 
Some claim that they were the first Chinese people to arrive in China. Others claim that the Hakka are the descendants of the Xiongnu tribe. This much is agreed upon: At various stages between the fourth and thirteenth centuries AD, large numbers of people were forced to flee their homes in the war-torn Yellow River Valley to seek refuge in southern China. These war refugees came to be known as Kejia, a Hakka word meaning \"strangers\" or \"guests.\" When the savage Mongol hordes swept across China in the thirteenth century, many Hakka fled to the south to escape the carnage. Today most of them are either in southern China or in Taiwan. A small number have migrated to Canada.","Among the younger generation of Turks, many are more focused on food, entertainment, and relationships than on religious life. While Islam is their official religion, for many it functions more as heritage than daily practice. A growing number identify with a secular worldview, shaping their identity more around modern culture than traditional faith. At the same time, many Turks have faced political and social restrictions, including limits on property ownership and employment opportunities. They need to encounter the goodness of God in ways that speak to their hearts and daily struggles. Tools like the JESUS Film and other media can be powerful avenues for sharing the gospel with them.","Muslim Autrah Jats are brave, hardworking people who possess both the desire and ability to rule. It has been said that no Jat wants to be ruled. Rather, he desires to have power over a group if not over an area. \r\n\r\nAutrah Jats take great pride in their ancestry. In fact, all the Jats in a particular village consider themselves to be the descendants of the man whom they believe founded it by the power of the sword. Most Jats live in rural areas. A small percentage are traders and laborers. 
Today, the Jats are well read, and some occupy high positions in academic and technical arenas.\r\n\r\nPhysically, the Jats are usually taller and heavier than most of their neighbors. Because of their larger build, their reputation for violence, and the fact that they control much of the land and village income, they are generally feared by other communities.","The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were a class of South Asian warriors and nobles for centuries. At certain times they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. In the 20th century, Indian Prime Minister Indira Gandhi abolished the titles and property rights enjoyed by Rajputs. Today the Rajputs love to share about the military exploits of their ancestors. Some Rajputs own impressive hotels where tourists can be introduced to their proud history.","The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were the class of South Asian warriors and nobles for centuries. At certain times they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. Today Chauhan Rajputs love to share about the military exploits of their ancestors.","","","The Ho are known for their independent nature, which has historically separated them from the rule of powerful Hindus. The tribe's culture is intertwined with the natural world. They are most comfortable in the forest environment that supplies many of their necessities. 
Their major agricultural crop is rice, which they ferment to make beer.","","","The Kamboh or Kamboj are a Hindu and Sikh people who live in northwest India. They claim to be descendants of royalty from Persia. During the times of the Mughuls and British, the Kamboh served in high-ranking positions in administration and in the military. Today many Kamboh own land that is worked by lower castes. The Kamboh are employed in careers of government, education, law, business, and the military. The primary language of the Kamboh is Hindi. They also speak English and regional Indian languages.","","There are many sub-Saharan tribes in Sudan that we describe as \"Arabized,\" one of which is the Tamain. They look like sub-Saharan Africans and retain a certain degree of their original culture, yet they began adopting the traditions and practices associated with Arabic Islamic culture. The process of Arabization accelerated when Sudanese Arabs filled the power vacuum at the time of independent in 1956. Arab Muslims achieved greater influence through conquest and an Arabic language-based education system.","The Southern Nasu probably originated in southern Sichuan and northern Yunnan many centuries ago. The name Nasu means \"black people.\" The color black is revered by the Nasu. They are polytheists who attempt to placate a wide array of spirits and deities. Some spirits are considered helpful while others are evil and cause death, sickness, and destruction.","","","The earliest ancestors of the Uzbeks, the Central Asian Turks, aided Genghis Khan in his conquest of Eastern Europe in the 1300s. Eventually, as unity between the Turks and Mongols faded, numerous warring kingdoms were formed. It was from several of these kingdoms that the Uzbeks descended. \r\n\r\nBy the mid-1800s, most of the Uzbeks had been conquered by the Russians. 
Others lived in Mongolia where they were only obliquely controlled by the Soviets after the USSR was established in 1917.","The Meskhetian Turks are a Turkish people originally from a part of southern Georgia that borders Turkey. However, under Stalin's policies during the time of the Soviet Union, the Meskhetian Turks were forcefully deported to Central Asia, where they experienced discrimination and civil rights abuses. When they were finally permitted to return to their homeland, Georgia did not allow them to resettle there. Today these people live in several countries, with the largest population in Russia. They are Muslim, but many of their traditions contain a mixture of Muslim, Caucasian and Russian elements.","","Today, Nepal is trying to preserve the environment in lands where the Bote peoples have hunted and fished for centuries. This situation has made it impossible for them to provide for themselves. The Nepali government is in the process of trying to get Bote people involved with conservation efforts and eco-tourism so they can earn a living. However, such jobs will not provide for everyone who needs one. People who speak Bote languages like Majhi are in the process of switching to Nepali.","The Jews in Azerbaijan believe they are descended from Jews taken captive by the Assyrians and displaced to the cities of the Medes. They spoke a dialect of Old Persian upon which the Azerbaijani Jewish Tat language is based. Because of their unique history and culture, the Jews of Azerbaijan have a strong sense of identity. Although they have much in common with other Jews around the world, they have a very distinctive lifestyle. Many of these Jews are Ashkenazim, descendants of Jews who inhabited the Germanic regions of Europe. After World War II, they lived in the Caucasus Mountains of the Soviet Union. Today, they are known as the \u201cMountain Jews,\u201d scattered in the mountains of Azerbaijan. 
Some continue to follow the Law of Moses while others have intermarried with Muslims.","Beginning in the 15th century, the Zerma-Songhai peoples made up an empire that controlled most of central and western Niger. The French arrived in the early 20th century, subjugating the Zerma and their neighbors under colonial rule. Though the Zerma are no longer part of a powerful empire, they remain a proud people, resistant to change."],"top_values":[["",3167],["The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were a class of South Asian warriors and nobles for centuries. At certain times they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. In the 20th century, Indian Prime Minister Indira Gandhi abolished the titles and property rights enjoyed by Rajputs. Today the Rajputs love to share about the military exploits of their ancestors. Some Rajputs own impressive hotels where tourists can be introduced to their proud history.",88],["Jats are brave, hardworking people who possess both the desire and ability to rule. It has been said that no Jat wants to be ruled. Rather, he desires to have power over a group if not over an area. They take great pride in their ancestry. Today, the Jats are well read, and some occupy high positions in academic and technical arenas. Physically, the Jats are usually taller and heavier than most of their neighbors. Because of their larger build, their reputation for violence, and the fact that they control much of the land and village income, they are generally feared by other communities. The Jat peoples are among the most prosperous groups in India on a per-capita basis. 
Ironically, because they value thriftiness and diligence, the Jats are often regarded as miserly.",74],["Members of the Bania caste are among the wealthiest people in India, and even the world. They are involved with businesses and money lending. A Bania might be the proud owner of a giant business, a small one, or he might be working in a bank. He might even own the bank. Others work in government ministries or as lawyers, judges, teachers, scholars, stockbrokers, or engineers.\r\n\r\nThey are often resented by other castes, because they lend much needed money at high interest rates. A pre-literate farmer might take a loan from a Bania only to find that a high percentage of his harvest will be taken away as interest. Bania customers often must put their farms or their gold up for collateral in case they cannot pay back their loans.",14],["Beldar are a Hindu people of India whose name means \"one who digs.\" They work in construction as those who excavate the ground and transport dirt. Other Beldar work as landless agricultural laborers. Since the Beldar do manual labor, many Hindus look down on them. Beldars are part of the fourth level caste of Hinduism, the Sudras. \r\n\r\nBeldars marry within their caste but they do not marry cousins as is often common in lower caste peoples. The government and NGOs are making efforts to educate the Beldar so that they might become part in the modern economy of India.",8],["The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were the class of South Asian warriors and nobles for centuries. At certain times they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. 
Today the Rajputs love to share about the military exploits of their ancestors.",7],["The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were the class of South Asian warriors and nobles for centuries. At certain times, they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. In the early 1970s, Indian Prime Minister Indira Gandhi abolished the titles and property rights enjoyed by Rajputs. \r\n\r\nToday the Rajputs love to share about the military exploits of their ancestors, and many of them are still in military service or own land. Wealthy Rajputs own impressive hotels where tourists can be introduced to their proud history. Those of modest means own small businesses or work as wage laborers.",7],["The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were the class of South Asian warriors and nobles for centuries. At certain times, they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. In the early 1970s, Indian Prime Minister Indira Gandhi abolished the titles and property rights enjoyed by Rajputs. \r\n\r\nToday the Rajputs love to share about the military exploits of their ancestors, and many are still in military service or own land. Wealthy Rajputs own impressive hotels where tourists can be introduced to their proud history. Those of modest means own small businesses or work as wage laborers.",6],["The name Rajput is derived from the Sanskrit word rajputra, meaning \"son of a ruler.\" Rajputs were the class of South Asian warriors and nobles for centuries. 
At certain times, they were the warriors who conquered kingdoms and defended the land; when possible they enjoyed the life of nobles. When the British Empire began controlling parts of the Subcontinent starting in the late 1700s, they recruited Rajputs into their military. In the early 1970s, Indian Prime Minister Indira Gandhi abolished the titles and property rights enjoyed by Rajputs. \r\n\r\nToday Rajputs love to share about the military exploits of their ancestors, and many are still in military service or own land. Wealthy Rajputs own impressive hotels where tourists can be introduced to their proud history. Those of modest means own small businesses or work as wage laborers.",6],["Jats are brave, hardworking people who possess both the desire and ability to rule. It has been said that no Jat wants to be ruled. Rather, he desires to have power over a group if not over an area. \r\n\r\nThey take great pride in their ancestry. In fact, all the Jats in a particular village consider themselves to be the descendants of the man whom they believe founded it by the power of the sword. Most Jats live in rural areas. A small percentage are traders and laborers. Today, the Jats are well read, and some occupy high positions in academic and technical arenas.\r\n\r\nPhysically, the Jats are usually taller and heavier than most of their neighbors. Because of their larger build, their reputation for violence, and the fact that they control much of the land and village income, they are generally feared by other communities.\r\n\r\nThe Jat peoples are among the most prosperous groups in India on a per-capita basis. Ironically, because they value thriftiness and diligence, the Jats are often regarded as miserly.",5],["The Mandaeans are descendants of Jewish-Christian Gnostics (AD 150), and may be the only sect from late antiquity to identify themselves as Gnostics. Sometimes Mandaeans are called Christians of Saint John. 
Until recently, Mandaeans lived mainly in Iraq and Iran, but many have now fled Iraq and settled in other countries. \"A very strange and singular people, in terms of their rituals, lives in the desert near Baghdad....they are a very simple people and they claim to possess a secret law of God, which they preserve in beautiful books.\" Ricoldo da Montecroce, c 1290. Mandaeism is based more on a common heritage than on any set of religious creeds and doctrines. They venerate John the Baptist, and baptism is their central sacrament.",4],["Traditionally the Lezgin people have been an agrarian and pastoral people. They are well known for the textiles that their women weave. Some Lezgins work in food processing while others work seasonally making jewelry or weapons.",3],["The Banjara were traditionally a nomadic community, but today they more commonly are settled and work in agricultural production. They believe that they were originally Hindu and were forcibly converted to Islam. They are non-vegetarians who eat beef. The Muslim Banjara have twelve clans. They maintain cordial relations with neighboring communities and share water sources with them. They belong to the Sunni sect of Islam.",3],["The name Rajput is derived from the Sanskrit word rajputra, meaning son of a ruler. The Rajputra constitutes a class of nobility. The Rajput clans emerged as a dominant community in north and western India in the colonial period. The economic data suggests that the majority of Rajput are landowners. A large number of communities have migrated to their present habitat, and this has made them one of the most mobile groups in India.",3],["The name of the community is derived from the word sona meaning gold, and the people who work with gold are called Sunar or Sonar. Traditionally they are goldsmiths, but with the availability of better educational facilities the Sonar have become inclined towards education. They claim their social status next to that of the Brahmin. 
Divorce and remarriage are allowed.",3],["Sindhu Jats are brave, hardworking people who possess both the desire and ability to rule. It has been said that no Jat wants to be ruled. Rather, he desires to have power over a group if not over an area. \r\n\r\nThey take great pride in their ancestry. In fact, all the Jats in a particular village consider themselves to be the descendants of the man whom they believe founded it by the power of the sword. Most Jats live in rural areas. A small percentage are traders and laborers. Today, the Jats are well read, and some occupy high positions in academic and technical arenas.\r\n\r\nPhysically, the Jats are usually taller and heavier than most of their neighbors. Because of their larger build, their reputation for violence, and the fact that they control much of the land and village income, they are generally feared by other communities.\r\n\r\nThe Jat peoples are among the most prosperous groups in India on a per-capita basis. Ironically, because they value thriftiness and diligence, the Jats are often regarded as miserly.",3],["Though most Bashkirs live in their homeland that is now in southwestern Russia, others have fled to other countries like Belarus, Moldova, Ukraine, Kazakhstan, Turkmenistan, Tajikistan, Kyrgyzstan, Azerbaijan, and Armenia. Bashkir cuisine is heavy on dairy products. Their traditional dish is bishbarmaq, with includes boiled meat and a type of noodle covered with herbs, onions and cheese. The Bashkirs love their folklore which is usually about their early history. It includes aspects of worldly wisdom, morals and social aspirations. These are in the form of mythology, fairy tales and legends. They are especially fond of poetry.",3],["The Karakalpaks are generally poor, and unemployment is high, but people do what they can to make a living, working on their vegetable plots and gardens, fishing, selling at markets, raising some livestock, doing casual or seasonal jobs, etc. 
There is no social security system, just a network of local makankenes committees who can provide temporary support for the destitute. Karakalpak societies are patrilineal, which means that the line of descent is traced through the males. Large families are the ideal, and the nuclear family is composed of as many as four generations in the same household. The Karakalpaks believe that families who share meals together will stay very close.",3],["The Izarguien are Saharan Arabs, a sub-group of the Tekna tribe. They adhere to the Maliki branch of Sunni Islam. The Tekna is a tribal confederation of Berber and Arab origins in southern Morocco and parts of northern Western Sahara. The Tekna tribes speak the Hassaniya Arabic and Berber Tamazight languages. Their traditional lifestyle was partly nomadic, based on camel and goat herding, and partly sedentary, controlling important routes of the Saharan caravan trade.",2],["The term \"Moor\" is generally applied to any person, regardless of skin color, who speaks one of the Hassaniya dialects. Therefore, there are both black and white Moors who speak the same language. The Moors are primarily farmers. However, the Black and White Moors of Morocco are relatively urbanized and work in various trades. This has caused the traditional structures of Moorish society to change considerably. The Moors are a very proud people, conveying a sense of superiority to others in the area. Parents pre-arrange marriages, with the groom's father requesting the hand of the bride. 
A Moorish woman does not marry against her family's wishes.",2]],"top_words":[["the",21416],["and",10210],["of",10092],["in",8831],["are",6680],["they",6104],["a",5776],["to",5738],["their",4915],["is",3345],["have",2716],["as",2379],["people",2126],["for",2088],["from",1796],["live",1677],["with",1462],["that",1412],["who",1373],["most",1354],["many",1314],["by",1309],["or",1224],["some",1185],["were",1025]],"vocab_skipped":null,"word_histogram":{"counts":[3167,2,11,19,43,99,111,181,237,224,298,293,339,258,377,304,218,306,169,189,108,57,18,12,6,45,28,2,1,2],"edges":[1.0,7.7,14.4,21.1,27.8,34.5,41.2,47.9,54.6,61.300000000000004,68.0,74.7,81.4,88.10000000000001,94.8,101.5,108.2,114.9,121.60000000000001,128.3,135.0,141.70000000000002,148.4,155.1,161.8,168.5,175.20000000000002,181.9,188.6,195.3,202.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":3685,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.00028074115665356543,"duplicate_rate":0.4827344188658057,"emoji_rate":0.0,"len_max":1212,"len_mean":309.70087029758565,"len_median":316.0,"len_min":0,"len_p95":793.0,"n_duplicates":3439,"n_empty":3167,"one_word_rate":0.4445536215609208,"readability_flesch_mean":30.396914710475183,"url_rate":0.0,"vocab_size":24501,"word_mean":51.25926445816957,"word_median":52.0}},{"alerts":[{"code":"one_word","level":"warn","message":"44.5% rows are a single word"},{"code":"duplicates","level":"warn","message":"48.9% duplicate 
strings"}],"column":"Obstacles","extras":{"language_counts":{"__engine":"fasttext:2,805","en":2805},"language_sample_size":5000,"length_histogram":{"counts":[3167,1,24,103,198,293,407,420,353,355,265,223,173,161,232,87,222,194,69,39,31,24,11,8,9,13,12,4,7,3,4,4,1,0,2,1,0,2,1,1],"edges":[0.0,18.15,36.3,54.449999999999996,72.6,90.75,108.89999999999999,127.04999999999998,145.2,163.35,181.5,199.64999999999998,217.79999999999998,235.95,254.09999999999997,272.25,290.4,308.54999999999995,326.7,344.84999999999997,363.0,381.15,399.29999999999995,417.45,435.59999999999997,453.74999999999994,471.9,490.04999999999995,508.19999999999993,526.3499999999999,544.5,562.65,580.8,598.9499999999999,617.0999999999999,635.25,653.4,671.55,689.6999999999999,707.8499999999999,726.0]},"near_unique":false,"sample":["","The Mansoori Muslims live in the west Indian state of Gujarat concentrated in the city of Ahmedabad. The gospel presence is very weak in this part of India. It will take outsiders to establish the church among the Mansooris.","There is much animosity between Christians and Muslims in Nigeria that can interfere with gospel outreach.","Spiritual opposition can be expected whenever Jesus Christ is presented. Pray this will be overcome and the people will find freedom to understand and believe.","The Ghosi live mainly in parts of India with few Christian believers. Few will ever meet someone who lives the abundant life offered by Jesus Christ.","","The Kandu of Nepal and the larger population of Kandu who live in northeast India are considered unreached. They are almost all Hindus and have been so for hundreds of years. If Christian workers came to live among them, they would be considered outsiders and foreigners. It would take time to gain their trust.","","There is much conflict between settled Christian and Muslim nomadic herders like the Nigerian Fulani. 
This brings an extra layer of resistance to the gospel.","Maintaining their identity while being surrounded by European culture is very important to many Moroccan Arabs. This can limit openness to the gospel.","Walang people adhere to Buddhism. The Walang are a desperately needy unreached people group. They have no Scripture, JESUS Film or gospel recordings in their heart language, Walungge. Few have ever been exposed to the gospel in a meaningful way that would allow them to intelligently accept or reject Christ. It is extremely difficult for outsiders to get to rural Bhutan.","Many Nai are illiterate or functionally illiterate. The gospel needs to be shared with them in oral and visual forms.","","The needs of the Omanis are mainly spiritual. They have very few chances to hear about the only Savior, and they have remained closed to ideas outside of their sect of Islam. Salvation by the grace of a sin-free Savior is a foreign and threatening concept","","","","","","","Geographic isolation makes access to the Dakpa difficult, and the country of Bhutan does not welcome Christian witness.","The Nail Bedouins are isolated because they often move from place to place. Christian missionaries have always been reluctant to live among nomadic peoples. Thus the Nail and other Bedouin tribes remain with no one to challenge their folk Islamic beliefs.","Though it's unfair, Jewish people often consider the atrocities against Jews through the ages as being from Christians. They do not understand living Christianity.","As Muslims, the Chechens have been taught from an early age that they must be Muslim and there are no other choices. France's secular environment and traditions based Christianity show no good alternatives for the Muslim populations.","","","The Ramdasias live in places like Rajasthan that have an exceptionally low number of Christians. 
The only way for them to hear the gospel preached will be if someone goes to them from elsewhere.","Establishing trust with the Muslim Bajau Kagayan people may be difficult.","The gospel, and Jesus himself are often viewed as foreign to people from East Asia.","Christianity is widely seen as a foreign religion, belonging to others and not to Turks themselves. Because of this perception, few are willing to risk the shame or rejection that might come from openly following Christ.","Autrah Jats have a very good self-image. \"Men may come and men may go, but I go on forever,\" is a well-known Jat proverb. This sense of pride and accomplishment, along with a popular South Asian misconception that Christianity is only for the downcast, closes Autrah Jat hearts to responding to the gospel.","Rajputs have a strong sense of pride in their historical exploits. Even today they enjoy high status which reinforces that pride. Pride of the wrong sort is anathema to our Lord, and Rajputs will need to overcome this spiritual obstacle and accept the Kingdom of God like small children if they are going to enter it.","Chauhan Rajputs have a strong sense of pride in their historical exploits. Even today they enjoy high status which reinforces that pride. Pride is anathema to our Lord, and Rajputs will need to overcome this spiritual obstacle and accept the Kingdom of God like small children if they are going to enter it.","","","The New Testament is printed in the Ho language and some mission agencies work among them. Mission efforts have led to a small community of Christ followers, but there is a need for more outreach.","","","The Kamboh occupy a high place in Indian society. Their pride, wealth and position may prevent them from humbly coming to Christ.","","Unlike some other Arabs, Sudanese Arabs have no Christian tradition. As they \"Arabized\" the tribes in Sudan, they made a point of spreading Islam along with Arabic culture. 
For this reason, Arabized tribes like the Temain are almost entirely Muslim, and v","Today most Southern Nasu have no knowledge of Christianity. Much is needed in the way of models of Christian behavior as well as in formal instruction.","","","Most Uzbeks are Muslim in name only. A good number of them are very secularized.","Lack of prayer and lack of obedience to the command of Christ to preach the good news to all creation continues to slow the advance of the gospel.","","The Bote-Majhi people live in a place where there is little access for those who can take them the gospel.","Reaching them will require overcoming entrenched religious systems and political and geographical barriers.","Although there appears to be a strict adherence to Islam on the surface, many Zerma also incorporate animistic practices into their daily life resulting in a type of folk Islam which brings more spiritual baggage. Only about 10 percent of the Zerma are literate, so those who take them the gospel will need to rely on non-printed materials."],"top_values":[["",3167],["Rajputs have a strong sense of pride in their historical exploits. Even today they enjoy high status which reinforces that pride. Pride of the wrong sort is anathema to our Lord, and Rajputs will need to overcome this spiritual obstacle and accept the Kingdom of God like small children if they are going to enter it.",88],["Overall, the Jats have a good self-image. \"Men may come and men may go, but I go on forever,\" is a well-known Jat proverb. This sense of pride and accomplishment, along with a popular South Asian misconception that Christianity is only for the downcast, closes Jat hearts to responding to the gospel.",74],["The Beldars consider their basic identity is to be Hindu. 
Much prayer and the power of the Holy Spirit will be necessary to bring the Beldar into a saving knowledge of Christ.",8],["The Hindi speaking diaspora needs to find a new love\u2014a love for Jesus Christ, the one who offers them life to the full. As it stands, most are satisfied with religion.",7],["Overall, the Jats have a very good self-image. \"Men may come and men may go, but I go on forever,\" is a well-known Jat proverb. This sense of pride and accomplishment, along with a popular South Asian misconception that Christianity is only for the downcast, closes Jat hearts to responding to the gospel.",7],["For many Bosniaks, Islamic identity has more to do with cultural roots than with religious beliefs. Even among most religious Bosniaks, there is a disdain for religious leaders exercising any influence over day-to-day life. Bosniaks are no different than ",6],["Their nomadic lifestyle has made it difficult for workers to reach them. The Islamic religion is very difficult to influence.",5],["Fear of the spirit world and a suspicion that putting faith in Christ will alienate them from their communities are two major obstacles.",5],["Until the twentieth century, most Azeri identified themselves as Muslims rather than Azerbaijani or Turks. They believe that being a \"spiritual community of Islam\" was much more important than being a nation.",5],["After centuries of isolation the Mandaeans are quite insular and protective of their society and their religion. Christian resources are limited in their mother tongue.",4],["Bosniaks are no different than other Muslims in that they view Islam as a key part of their cultural foundation. 
Turning to various forms of Christianity is like joining the enemy.",4],["No matter where they live, the Thai believe that \u201cto be Thai is to be Buddhist.\u201d They are polite, but not open to the ways of Jesus.",4],["The Burmese are dedicated to Buddhism, and it is central to their identity.",4],["Karakalpaks are overwhelmingly Sunni Muslim. Few have heard a fair gospel presentation or seen Christianity lived out in someone's life.",4],["There is little or no Christian witness, nor any example of living Christianity for the Najdi Arabs to see or experience.",3],["For many Bosniaks, Islamic identity has more to do with cultural roots than with religious beliefs. Bosniaks are no different than other Muslims in that they view Islam as a key part of their cultural foundation. Turning to various forms of Christianity i",3],["The Lezgins and other people groups from their homeland are noted for being suspicious of outsiders, and unwilling to change their ways.",3],["Giving up allegiance to personal deities may be threatening.",3],["Hinduism breeds a mindset where there are many possibilities. 
Few would consider the idea that there is one God and one Savior.",3]],"top_words":[["the",7403],["to",5234],["of",3881],["and",3125],["a",2886],["in",2832],["are",2634],["is",2576],["they",2147],["their",2098],["have",1345],["for",1276],["that",1262],["people",1008],["there",971],["will",905],["with",842],["be",841],["this",818],["as",801],["not",742],["gospel",718],["from",713],["need",687],["christ",681]],"vocab_skipped":null,"word_histogram":{"counts":[3167,13,141,277,468,415,473,430,343,317,246,121,101,293,157,44,36,16,17,11,5,11,11,3,2,1,0,1,2,2],"edges":[1.0,4.833333333333334,8.666666666666668,12.5,16.333333333333336,20.166666666666668,24.0,27.833333333333336,31.666666666666668,35.5,39.333333333333336,43.16666666666667,47.0,50.833333333333336,54.66666666666667,58.5,62.333333333333336,66.16666666666667,70.0,73.83333333333334,77.66666666666667,81.5,85.33333333333334,89.16666666666667,93.0,96.83333333333334,100.66666666666667,104.5,108.33333333333334,112.16666666666667,116.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":3641,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0009825940482874789,"duplicate_rate":0.4889107243121842,"emoji_rate":0.0,"len_max":726,"len_mean":106.86285794497473,"len_median":95.0,"len_min":0,"len_p95":317.0,"n_duplicates":3483,"n_empty":3167,"one_word_rate":0.4445536215609208,"readability_flesch_mean":31.624325104582795,"url_rate":0.0,"vocab_size":9760,"word_mean":18.369034250421112,"word_median":16.0}},{"alerts":[{"code":"one_word","level":"warn","message":"54.5% rows are a single word"},{"code":"duplicates","level":"warn","message":"60.0% duplicate 
strings"}],"column":"HowReach","extras":{"language_counts":{"__engine":"fasttext:2,291","en":2291},"language_sample_size":5000,"length_histogram":{"counts":[3883,0,1,7,61,156,252,244,277,269,274,233,219,184,357,172,135,90,103,60,39,22,24,12,9,14,5,4,3,1,3,2,1,3,0,2,2,0,0,1],"edges":[0.0,14.975,29.95,44.925,59.9,74.875,89.85,104.825,119.8,134.775,149.75,164.725,179.7,194.67499999999998,209.65,224.625,239.6,254.575,269.55,284.525,299.5,314.47499999999997,329.45,344.425,359.4,374.375,389.34999999999997,404.325,419.3,434.275,449.25,464.22499999999997,479.2,494.175,509.15,524.125,539.1,554.0749999999999,569.05,584.025,599.0]},"near_unique":false,"sample":["","Gujarati is their main language. Many also speak Urdu which allows them to communicate with most India peoples. Between these two languages, there are all kinds of gospel materials they can read, hear or see.","","There are a number of Christians in Guinea-Bissau. Pray that the Lord will lead some of these to befriend the Biafada people, and share Christ with them. Pray for boldness to do this, with tact.","","","","","Settled Christian farmers in Cameroon can reach out to the Fulani through hospitality and kindness, potentially opening the way for dialogue.","On the other hand, some Moroccan Arabs want contact with the Norwegian population. Christian believers can interact with them, sharing the blessings of Jesus Christ.","Passionate and consistent prayer is most likely the only possible outreach at this time.","","","Radio broadcasts and sending them copies of the JESUS Film might help them to find their way to the cross.","","","","","","","Translation of scripture into the Brokpake language is needed, as well as Gospel recordings. Pray for funds and workers.","Believers can bring the Nail Bedouins education and opportunities to learn new ways of earning a living. The few Algerian believers can reach out to them.","A small but growing group of Jews in the UK call themselves Messianic Jews. 
These Jews have accepted Jesus of Nazareth as their Messiah. They can be the beginning of a movement to Christ among English speaking Jews in the UK.","Because of the trauma Chechens have faced, most of them are likely to want to know inner peace. Islam cannot offer that. Believers can offer Bible studies that focus on finding inner peace by submitting to Jesus Christ.","","","There are Christ followers among other Chamar people who can reach these people for the Lord.","Christians can carry the good news of Jesus to the Bajau Kagayan by telling them stories from Scripture, and by using Gospel films and recordings.","Other Han Chinese people are very similar in culture to the Hakkas. They have their own churches, and they can reach out to their Hakka \"near neighbors.\"","","The Jats need clean drinking water and proper health care facilities. Christian medical teams and humanitarian aid workers are needed in rural areas to work among them and show them God's love in practical ways.","Long-standing traditions as well as spiritual forces keep Rajputs away from the Savior no matter where they live. Reaching the Rajputs would be enabled by knowledge of India's history and experience with the caste system.","Long-standing traditions as well as spiritual forces keep the Muslim Chauhan Rajputs away from the Savior. Reaching the Rajputs would be enhanced by knowledge of South Asian history and how the caste system affects their worldview.","","","Utilizing the availability of the New Testament and the already existing connections with the Ho will help to reach them. Prayer will also be an important tool.","","","Bibles, literature, films and radio programs exist in Hindi. 
Hindu background believers can share with the Kamboh the blessings only found in Christ.","","Christian believers can take the savior to the Arabized Temain by helping them with their medical needs.","Christians need to build bridges of friendship and trust with these people.","","","Uzbek families are extended, with a patriarchal authority ruling over several generations. Each village has an elder, and several villages comprise an elat. Each elat is governed by a council of male elders. Missionaries can make a point of reaching these male elders who can open the door for a people movement among Uzbeks.","Georgia has many Christians, mostly Orthodox but some are evangelicals. Please pray that some of these Christians will gain an interest in carrying the gospel message to the Meskhetians in their own country.","","Believers can train these people in new marketable skills that will help them adjust to their new circumstances.","","Today half of the Zerma population is under the age of 15 due to increasing birthrates and decreasing infant mortality rates. Children are much more spiritually open than their elders, so it would be a good idea for believers to reach out to them.\r\n\r\nSince only ten percent of Zerma people are literate, pray that gospel recordings, audio Bibles, and radio broadcasts will become widely available to the Zerma people."],"top_values":[["",3883],["The Jats need clean drinking water and proper health care facilities. Christian medical teams and humanitarian aid workers are needed in rural areas to work among them and show them God's love in practical ways.",136],["Long-standing traditions as well as spiritual forces keep Rajputs away from the Savior no matter where they live. Reaching the Rajputs would be enabled by knowledge of India's history and experience with the caste system.",70],["It is vital for those who go to Brahmins to build genuine relationships; they must pray for Brahmin friends, and eventually pray with Brahmin friends. 
We must focus on Christ himself as a living person, and on the supreme almighty God who was revealed by Christ as a loving father.",38],["Long-standing traditions as well as spiritual forces keep the Rajputs away from the Savior no matter where they live. Reaching the Rajputs would be enabled by knowledge of India's history and experience with the caste system.",18],["The JESUS Film and a Bosnian Bible are available. There is even a children's Bible, filled with stories of Jesus. These can be personally shared with Bosniaks or downloaded from computers.",14],["The JESUS film is available in the two primary languages of the Beldar, Kannada and Hindi. Radio programs would also be helpful in reaching the Beldar.",8],["The quality of health care, nutrition, housing, and education is poor, especially those who live in refugee camps. Believers with the right skills could be a blessing to the Romani by providing medical needs.",6],["South Asians come together each August 15 to celebrate Independence Day. That is a time for all religious communities to come together. Christ followers can give away copies of the JESUS Film and Bibles in Bengali.",6],["Rural Jats need clean drinking water and proper health care facilities. Christian medical teams and humanitarian aid workers are needed in rural areas to work among them and show them God's love in practical ways.",5],["Shia Muslims understand that even the righteous can face injustice and martyrdom. They might be more open to the death and resurrection of Christ than other Muslims.",5],["Mandaens now reside in some western countries, and access is easier than in the past. Christians should reach out to befriend these people, and find out more about their culture, their religion, and their world view. There are likely bridges to this people given their ancient roots in Christianity.",4],["Their animistic beliefs center around inherently evil spirits called nats. 
The Burmese spend their lives trying to appease the nats which Jesus Christ has already defeated. Christian believers who are familiar with spiritual warfare can demonstrate his power over these spirits.",4],["There is a complete Bible in their language. This can become available through distributions or through downloads on the internet.",4],["There are Bible portions and the JESUS Film in their language which they can access through computers.",3],["Jews for Jesus have experience in speaking to the Jewish heart. Perhaps they can reach them.",3],["Pray for the Lord to raise up a strong disciple making movement to saturate the hearts and minds of this people group.",3],["Pray that persons and households of peace will be found among the Banjara who will catalyze movements to Jesus among their own people.",3],["Sustained, focused prayer is needed to open the hearts of Rajput families to experiencing God's blessing through a movement of family-based discovery Bible studies.",3],["Pray the few believers among the Sonar will grow in sharing and discussing God's Word with their families and 
clans.",3]],"top_words":[["the",6258],["to",3985],["and",3248],["in",2565],["of",2363],["can",1776],["are",1468],["a",1208],["their",1165],["they",1161],["be",1151],["them",1095],["for",1026],["with",1012],["gospel",871],["who",856],["people",855],["will",834],["as",796],["there",788],["christ",787],["is",723],["believers",703],["that",678],["pray",659]],"vocab_skipped":null,"word_histogram":{"counts":[3883,2,42,157,262,431,312,391,308,224,488,173,144,69,106,52,21,21,9,6,7,4,5,1,2,2,1,0,0,1],"edges":[1.0,4.4,7.8,11.2,14.6,18.0,21.4,24.8,28.2,31.599999999999998,35.0,38.4,41.8,45.199999999999996,48.6,52.0,55.4,58.8,62.199999999999996,65.6,69.0,72.39999999999999,75.8,79.2,82.6,86.0,89.39999999999999,92.8,96.2,99.6,103.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":2853,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.00028074115665356543,"duplicate_rate":0.5995227400336889,"emoji_rate":0.0,"len_max":599,"len_mean":80.82116788321167,"len_median":0.0,"len_min":0,"len_p95":260.0,"n_duplicates":4271,"n_empty":3883,"one_word_rate":0.5450589556428973,"readability_flesch_mean":27.33691586593914,"url_rate":0.0,"vocab_size":7803,"word_mean":14.0807130825379,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"70.6% rows are a single word"},{"code":"duplicates","level":"warn","message":"76.0% duplicate 
strings"}],"column":"PrayForChurch","extras":{"language_counts":{"__engine":"fasttext:1,473","en":1473},"language_sample_size":5000,"length_histogram":{"counts":[5032,0,1,16,45,104,109,143,160,184,125,315,103,115,91,92,53,101,52,115,17,27,23,33,15,3,13,9,5,2,6,3,2,2,2,2,1,0,1,2],"edges":[0.0,16.225,32.45,48.675000000000004,64.9,81.125,97.35000000000001,113.57500000000002,129.8,146.025,162.25,178.47500000000002,194.70000000000002,210.925,227.15000000000003,243.37500000000003,259.6,275.82500000000005,292.05,308.27500000000003,324.5,340.725,356.95000000000005,373.175,389.40000000000003,405.62500000000006,421.85,438.07500000000005,454.30000000000007,470.52500000000003,486.75000000000006,502.975,519.2,535.4250000000001,551.6500000000001,567.875,584.1,600.325,616.5500000000001,632.7750000000001,649.0]},"near_unique":false,"sample":["","Pray for God to bless every Mansoori community economically and spiritually as a testimony of his goodness and power.\r\nPray for the followers of Christ that will soon develop within the Mansoori community, that the Lord will provide pastors and teachers for them, and for them to become well-grounded in the faith, fully trusting in Christ.\r\nPray the Mansoori community will increasingly be aware of their need to know and follow the creator God.","","There is mention of a few followers of Jesus among the Biafada in Guinea-Bissau. Pray they will reach out to their neighbors with the gospel and that they will seek encouragement in growing in the knowledge of Christ.","","","","","","Moroccan believers in Europe can be Christ's ambassadors to these Muslims.","","","","","","","","","","","There are a few followers of Christ among the Dakpa. Pray they will grow in their faith. Pray they will desire to share the good news of Christ with family and friends, not being unduly timid. 
Pray that scripture will soon become available in their language.","","","There are no followers of Christ among the Chechens in France, so pray for many to find Him during this time of instability.","","","Pray that the Ramdasia Chamars will find dignity and hope in Jesus Christ. Pray for workers to be thrust out to this unreached people group. Pray for a movement to Christ to happen among them this decade.","Pray for the few followers of Jesus among the \"Sea Gypsy\" people of the Philippines, that good teachers will be sent to help them grow. Pray they will be firmly established on the truths of Scripture, and will be zealous to study and learn, and be faithful disciples of Christ.","Pray that the Hakka believers will be used of God to begin a disciple making movement among their people in Canada.","","There are few followers of Christ among any Jat community. Pray that the few who answer Christ's call will be used of Him to share His glory and life-changing gospel with other Jats.","Pray that the small group of Christian believers among the Rajputs will be united in love around the truth of Scripture. Pray they live a life of love, just as Christ loved them and gave himself up for them.\r\nPray for the few Rajput believers to have the boldness to share the ways of Christ with other Rajputs.","Pray that the small group of Christian believers will be united in love around the truth of Scripture. Pray they live a life of love, just as Christ loved them and gave himself up for them.\r\nPray for the few Rajput believers to have the boldness to share the ways of Christ with other Rajputs.","","","Pray that the church would thrive and that they would spread the word to their neighbors. 
Pray that all conflict within the church would be resolved peacefully, with the guidance of the Holy Spirit.","","","Pray that any existing Kamboh believers might increase in numbers and that all Kamboh would have the opportunity to hear the gospel in a way they both understand and will accept.","","","There may be 100 followers of Christ among this people group. Pray they will be adequately instructed in the faith, and will increasingly trust Christ for their lives, as well as for their salvation.","","","Pray that the few followers of Christ among the Uzbeks in Mongolia will let the light of Jesus shine through them in their communities, so people can see holiness and spiritual transformation.","There are no known Christians among the Meskhetians in any country of residence.","","Pray that the few followers of Christ among the Bote Majhi people will be salt and light to their neighbors and family members.","","Pray that the small number of Zerma believers will be moved by the Holy Spirit to reach their own people."],"top_values":[["",5032],["There are few followers of Christ among any Jat community. Pray that the few who answer Christ's call will be used of Him to share His glory and life-changing gospel with other Jats.",146],["Pray that the small group of Christian believers among the Rajputs will be united in love around the truth of Scripture. Pray they live a life of love, just as Christ loved them and gave himself up for them.\r\nPray for the few Rajput believers to have the boldness to share the ways of Christ with other Rajputs.",88],["Pray that the few Brahmin-background believers will exhibit the fruit of the Holy Spirit with those they meet so that Christ will be honored and held in high esteem by these influential people.",43],["Pray that the small group of believers will be united in love around the truth of Scripture. 
\r\nPray they live a life of love, just as Christ loved them and gave himself up for them.\r\nPray for the few Rajput believers to have the boldness to share the ways of Christ with other Rajputs.",30],["Pray that the small group of believers will be united in love around the truth of Scripture.",19],["Pray the few followers of Christ among the Beldar peoples will live such joyful, loving and victorious lives that they will draw their Hindu neighbors to Jesus Christ.",8],["Pray that the few Brahman-background believers will exhibit the fruit of the Holy Spirit with those they meet so that Christ will be honored and held in high esteem by these influential people.",7],["There likely are no Christian believers among the Mandaeans, but pray those who will soon find Christ will be able to clearly understand the Good News of Christ, especially the grace He offers.",4],["Pray that the Holy Spirit will give the few believers among this people group the spiritual power to glorify His name among all peoples in Sri Lanka.",4],["Pray that Gond believers will live victorious lives that will draw others to the Savior.",4],["There are probably no present followers of Jesus among the Muslim Banjara community, but pray for those the Lord will soon call to himself. Pray they will have nothing to do with the deeds of darkness, living as children of light. Pray for materials to help them grow properly, such as recorded or written Scripture, and Gospel films.",3],["Pray for the few Rajput believers to be effective at engaging their families and communities in discussing Bible stories and experiencing God's blessing.",3],["There are few if any Christian believers among the Sonar, but pray for the ones that will soon be a part of this community. Pray they be well instructed in the faith, and will grow in maturity and in numbers. Pray they live holy lives.",3],["There are a few followers of Christ among the Teli. 
Pray that these will be fruitful and effective in sharing God's Word and blessing to strengthen their own families and spread God's blessing to other Teli households.",3],["There are no followers of Christ among the Zenaga Berbers, so pray for the Holy Spirit to move in their communities in the near future.",2],["Pray the few believers among the Regeibat will grow in sharing and discussing God's Word with their families and communities. Pray they will be accurately instructed in the faith, and that they will be strengthened by the Holy Spirit to live holy lives.",2],["There are no known Christian believers among this people at this time. Pray for hearts to begin to hunger for the forgiveness of sin found only in trust in the finished work of Jesus Christ.",2],["There are no followers of Christ who speak the Belait language. Pray that this will soon change.",2],["There are no believers among this tribal group. Pray this will soon change.",2]],"top_words":[["the",5287],["to",3297],["of",2886],["pray",2760],["and",2237],["will",2018],["for",1815],["that",1718],["in",1656],["among",1278],["be",1240],["believers",1072],["christ",1063],["they",1000],["a",946],["few",920],["there",900],["their",832],["are",812],["with",753],["followers",633],["them",570],["jesus",559],["who",545],["people",509]],"vocab_skipped":null,"word_histogram":{"counts":[5032,1,28,95,129,187,235,208,343,159,126,122,65,93,148,34,27,33,21,8,12,4,1,6,1,1,2,1,1,1],"edges":[1.0,4.766666666666667,8.533333333333333,12.3,16.066666666666666,19.833333333333332,23.6,27.366666666666667,31.133333333333333,34.9,38.666666666666664,42.43333333333333,46.2,49.96666666666667,53.733333333333334,57.5,61.266666666666666,65.03333333333333,68.8,72.56666666666666,76.33333333333333,80.1,83.86666666666666,87.63333333333333,91.4,95.16666666666667,98.93333333333334,102.7,106.46666666666667,110.23333333333333,114.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":1713,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":
0.0,"duplicate_rate":0.7595451993262212,"emoji_rate":0.0,"len_max":649,"len_mean":59.63447501403706,"len_median":0.0,"len_min":0,"len_p95":286.0,"n_duplicates":5411,"n_empty":5032,"one_word_rate":0.7063447501403706,"readability_flesch_mean":19.49725852373527,"url_rate":0.0,"vocab_size":4447,"word_mean":11.193992139247614,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"47.8% rows are a single word"},{"code":"duplicates","level":"warn","message":"51.7% duplicate strings"}],"column":"PrayForPG","extras":{"language_counts":{"__engine":"fasttext:2,528","en":2528},"language_sample_size":5000,"length_histogram":{"counts":[3406,0,6,47,86,145,136,176,159,208,212,264,274,330,321,243,275,197,240,117,76,59,43,34,22,11,11,6,11,4,3,1,0,0,0,0,0,0,0,1],"edges":[0.0,23.425,46.85,70.275,93.7,117.125,140.55,163.975,187.4,210.82500000000002,234.25,257.675,281.1,304.52500000000003,327.95,351.375,374.8,398.225,421.65000000000003,445.075,468.5,491.925,515.35,538.775,562.2,585.625,609.0500000000001,632.475,655.9,679.325,702.75,726.1750000000001,749.6,773.025,796.45,819.875,843.3000000000001,866.725,890.15,913.575,937.0]},"near_unique":false,"sample":["","","Pray for God to bring peace between Christians and Muslims in Nigeria.\r\nPray for the Lord to meet the physical and spiritual needs of the Pa'a, and that they will respond with gratitude and faith.\r\nPray for the Lord to send dreams and visions to Pa'a leaders so they will open the door for Jesus to enter the hearts of their people.\r\nPray for the Lord to send workers who are anointed by the Holy Spirit.","Pray the Biafada tribe will increasingly be drawn to Jesus (whom Muslims call Isa al-Masih) as they hear the Koran read in the mosque. 
Pray they will be given much curiosity to find out more about this man who is so much more than an honored prophet.","Pray that the council leaders will put their faith in Jesus and lead others into a movement to Christ.\r\nPray that gospel materials will lead them to salvation.\r\nPray for faithful intercessors and workers.\r\nAll kinds of gospel materials exist in the Hindi language, spoken by the Ghosi. Pray for them to be downloaded on their cell phones.","","Pray the Holy Spirit would create a spiritual hunger for God and his truth among the Kandu of Nepal.\r\nPray that soon there will be a movement to Christ among the Kandu in Nepal.\r\nPray the Lord would grant wisdom, safety and endurance to the workers who are now sharing the gospel with the Kandu in India.\r\nPray that the new believers among other people groups in Nepal would have a burden to reach the Kandu.\r\nPray that the Lord would build up the few known Kandu believers and use them to disciple many others.","","In the 2020s, there have been thousands of Fulani professing Christ. Pray for them to become His ambassadors throughout West Africa. Pray for the Lord to provide the Nigerian Fulani with abundant rain for their cattle as a testimony of his love and power. Pray for Nigerian Fulani elders to have dreams and visions that will point them to the only Savior.","Pray for a church planting movement among the speakers of Moroccan Arabic in Norway to grow and spread. Pray they would hear and follow the words of Jesus.","Without a single Christian believer, the Walang community will need people from India and Nepal to go to them. Pray that the Lord would raise up faithful intercessors for Walang people so there will be a strong movement to Christ among them. 
Pray that true churches would be planted and disciples trained among them.","Pray that a strong movement to Jesus would bring entire Nai families and communities into a rich experience of God's blessing.\r\nPray that Indian believers will build friendships with the Nai and share the gospel with them about the Savior.\r\nPray for increased access to good schools, particularly for Nai women and girls.\r\nPray for a movement to Christ that will soon bless the Nai.\r\nAsk the Lord to lead the Nai to listen to Christian radio programs in their languages.","","Pray for open hearts and minds to the ways of Christ among the Gulf speaking Arabs in Oman.\r\nPray for the Lord to raise up persons of peace to welcome Christ's ambassadors to Omani families.\r\nPray for the Lord to send His appointed workers to take Christ to this highly unreached people group.\r\nPray that there will be an unstoppable movement to Christ among every people group in Oman.","","","","","","","Pray these Buddhist peoples may be given the gift of awareness of sin, and the need for a Savior. Pray their hearts will be prepared when the good news of Christ comes to them.","Ask the Holy Spirit to grant fruitful and divine outreach strategies to mission agencies and workers focusing on Bedouins in Algeria.\r\nAsk God to raise up prayer teams who will faithfully intercede for the Nail Bedouin.\r\nAsk the Holy Spirit to complete the work that has begun in the hearts of Nail Bedouin believers in Algeria.\r\nPray for a movement to Christ this decade among the Nail and other Bedouin tribes.","Ask the Lord to send believers to build friendships with Jews of the UK and demonstrate God's love to them. Pray that God raises up a Messianic disciple making movement among the Jews of the UK. Pray that more and more Jews in the UK would be willing to investigate the claims of Jesus Christ. 
Pray that God would open the spiritual eyes of the Jews as they read and study the Old Testament.","Pray that followers of Christ in France will develop lasting friendships with Chechen Muslims, many of whom feel lonely and removed from their Islamic faith. \r\nPray that Chechens will receive the hope and comfort only found in the Lord. \r\nPray that Chechens in France will become strong believers who lead many of their people to the Lord.\r\nPray for the Chechens in France to form Christ-centered fellowships that will spread to Russia.","","","","Pray the Bajau Kagayan people will be able to provide adequately for their families, and be kept safe as they fish for their livelihood.","Pray for Bibles, the JESUS Film, and other Christian materials to find their way into Hakka homes in Canada.\r\n There are some Hakka believers in Canada. Pray that they will take the gospel to their kinsmen and plant churches.\r\nPray for a disciple-making movement among every Hakka people.","Ask the Lord to draw Turks to Himself through dreams and visions that reveal His glory.\r\nPray that those who believe will courageously share the gospel with their families and neighbors, and that entire communities would be touched.\r\nPray for fervent believers to reach out to Muslim Turks with faith and love.\r\nPray for a deep spiritual hunger among the Turkish, one that can only be satisfied by Jesus Christ, and for a movement of disciples to spread across Turkey and beyond.","Ask the Lord to send out more laborers to work among the Muslim Autrah Jats. \r\nPray that Christian doctors, nurses, and humanitarian aid workers will have opportunities to share the love of Jesus with the Autrah Jats. \r\nAsk God to save key Autrah Jat leaders who will boldly proclaim the gospel to their own people. 
\r\nPray for a disciple making movement to emerge among every Jat clan and community.","Pray the Lord will give them spiritual hunger, then satisfy that hunger with Christ.\r\nPray these people will understand the value of becoming part of God's royal family.\r\nPray for a Holy Spirit led humility for all Rajput communities to fall at the feet of the King of kings.\r\nPray for a disciple making movement among every Rajput community.\r\nPray for the Lord to bless the Rajputs with His abundant mercy, grace and guidance.","Pray the Lord will give Muslim Chauhan Rajputs a spiritual hunger, then satisfy that hunger.\r\nPray that these Rajputs will understand the value of becoming part of God's royal family.\r\nPray for a Holy Spirit led humility for all Rajput communities to fall at the feet of the King of kings.\r\nPray for a disciple making movement among every Rajput community.","","","Pray for the Ho people to be able to make their own spiritual decisions, free from outside pressures. Pray for a disciple making movement for the Ho people. Pray for their physical needs to be met by the Lord, leading them to put their faith in him alone.","","","Pray that the Kamboh leaders will come to Jesus Christ and lead others to Him. \r\nPray for Kamboh families to be drawn to Jesus and to the Bible to find out more about Him. 
\r\nPray the Kamboh people will understand that Jesus desires to bless their families and communities, not harm them.","","Pray for the Lord to provide for the physical and spiritual needs of the Arabized Temein people in Sudan.\r\nPray for workers, filled with the love of the Holy Spirit, to go to the Arabized Temein people.\r\nPray for the Arabized Temein people to crave pure spiritual milk and find it in the word of God.\r\nPray for a Holy Spirit directed movement to Christ among the Arabized Temein people.","Pray these people will be rescued from the control of evil forces, and will find full freedom in Christ.","","","Pray that Christian Uzbek leaders would be willing to take Christ to the Uzbeks in Mongolia.\r\nPray that new Uzbek believers would understand God's Word quickly and commit themselves to a local church where they will find strength.\r\nAsk God to grant wisdom and unity to mission agencies focusing on Mongolia.","The Meskhtians have been a persecuted people. Please pray for their well-being as a people, wherever they may live. Pray the Lord will awaken an interest among them to know Jesus in a personal way.","","Pray for believers to train these people in new marketable skills.\r\nPray for spiritual openness among all Bote peoples in Nepal.\r\nPray for a disciple making movement to flourish among them.","Pray for the Jews of Azerbaijan to be open to hearing about their Messiah.\r\nPray for laborers, anointed by the Holy Spirit, who will invest themselves in reaching this precious people group.\r\nTheir location presents a challenge. Scripture resources are available in their languages. Pray for radio and television outreach.\r\nPray for workers willing to take these resources to the mountain villages. 
Pray they would see much fruit.","Pray for a movement of the Holy Spirit through this unreached people group, that new believers will be discipled, and will disciple others.\r\nPray that strong churches will be planted, and more will grow from existing ones.\r\nPray for Zerma believers in Benin to be adequately discipled and sent out."],"top_values":[["",3405],["Pray the Lord will give them spiritual hunger, then satisfy that hunger with Christ.\r\nPray these people will understand the value of becoming part of God's royal family.\r\nPray for a Holy Spirit led humility for all Rajput communities to fall at the feet of the King of kings.\r\nPray for a disciple making movement among every Rajput community.\r\nPray for the Lord to bless the Rajputs with His abundant mercy, grace and guidance.",88],["Pray that Jat people will have a spiritual hunger that will drive them to seek and find Jesus Christ. Ask the Lord of the harvest to send out laborers filled with the power and the fruit of the Holy Spirit to serve the Jats. 
Pray for a disciple making movement to emerge among every Jat clan and community in the 2020s.",74],["Pray for the Lord to intervene in their families, calling people to his side.\r\nPray for loving workers.\r\nPray for their hearts to be drawn to the Lord of lords.\r\nPray for a church planting movement to thrive in their communities.",14],["Ask the Holy Spirit to soften the hearts of Bosniaks toward Christ followers so that they will be receptive to the gospel.\r\nPray that God will grant wisdom and favor to the mission agencies that are currently working among Bosnians.\r\nAsk the Lord to call people who are willing to share Christ with Bosniaks.\r\nAsk God to encourage the few known Bosnian believers in this region.\r\nAsk the Lord to raise strong churches among Bosnians that will plant more churches.",12],["Pray for the authority of Christ to bind hindering spiritual forces to lead them from darkness to light.\r\nPray for signs and wonders to happen among them and for great breakthroughs with a rapid multiplication of disciples and house churches.\r\nPray for bold workers who are driven by the love of the Holy Spirit to go to them.\r\nPray for an unstoppable movement to Christ among them.",8],["Pray for families of Beldar believers to become reproducing bodies of Christ, serving those around them with love and compassion. Pray for a chain reaction of Beldar families reaching families that results in thousands of new believers who share their faith with others. 
Pray that churches and believers will bless their entire people group in such a way that God's love will change the Beldar people like yeast changes dough.",8],["Pray for the authority of Christ to bind hindering spiritual forces to lead them from darkness to light.\r\nPray for signs and wonders among them and for great breakthroughs with a rapid multiplication of disciples and house churches.\r\nPray for bold workers who are driven by the love of the Holy Spirit to go to them.\r\nPray for an unstoppable movement to Christ among them no matter where they live.",6],["Pray for the Lord to intervene in their families, calling people to his side.\r\nPray for loving, anointed workers.\r\nPray for their hearts to be drawn to the Lord of lords.\r\nPray for a church planting movement to thrive in their communities.",5],["Pray the Mandaen diaspora peoples will be able to integrate into the cultures and societies where they now reside, and will be open to new world views.",4],["Pray for Hui culture to be renewed and enhanced by a work of the Holy Spirit and shaped into a God-centered and God-honoring mold.\r\nPray for the Holy Spirit to move among their family and community leaders to seek his face and enjoy his blessings.\r\nPray for the Lord to thrust out workers who will be compelled to nurture a disciple making movement among the Hui people.\r\nPray that soon the Hui people will have faith that will lead them to live honorable lives that will draw others to the savior.",4],["Pray that God will send courageous workers to them and faithful intercessors to pray until they have been discipled in the ways of Jesus.",3],["Pray for the authority of Christ to bind hindering spiritual forces to lead them from darkness to light.\r\nPray for signs and wonders among them and for great breakthroughs with a rapid multiplication of disciples and house churches.\r\nPray for bold workers who are driven by the love of the Holy Spirit to go to them.\r\nPray for an unstoppable movement to 
Christ among them.",3],["Pray for bold workers who are driven by the love of the Holy Spirit to go to them.\r\nPray for an unstoppable movement to Christ among them.\r\nPray for the authority of Christ to bind hindering spiritual forces to lead them from darkness to light.\r\nPray for signs and wonders to happen among them and for great breakthroughs with a rapid multiplication of disciples and house churches.",3],["Pray for the Banjara community to be able to adequately care for their families, and for widows, orphans, and elderly people to have the care and protection needed.",3],["Pray that a strong movement to Jesus will bring whole Rajput families and communities into a rich experience of God's blessings.",3],["Pray for the Sonar community to be humble enough to acknowledge their need for forgiveness of sin, and that they understand the provision for forgiveness that God has provided.",3],["Pray that a strong movement to Jesus will bring whole Teli families and communities into a rich experience of God's blessing.",3],["Pray for the Lord to provide an abundant harvest for the Bambara as a demonstration of his goodness and power. Pray for a spiritual hunger that will drive the Bambara people into the loving arms of Jesus Christ. Pray for the Lord to thrust out loving ambassadors to the Bambara people in West Africa. Pray for an unstoppable movement to Christ among the Bambara people.",3],["Pray for the Holy Spirit to give the Uzbek people teachable and understanding hearts. Pray for Uzbek families to be drawn by the Holy Spirit to seek forgiveness, and to understand the adequacy of Christ's work on the cross. 
Pray for a movement of family-based discovery Bible studies.",3]],"top_words":[["the",15176],["to",13361],["for",8513],["and",6652],["of",5588],["pray",5450],["that",4494],["will",3992],["a",3741],["in",3260],["their",2618],["among",2373],["lord",2107],["be",1936],["people",1868],["movement",1740],["them",1610],["jesus",1586],["christ",1502],["would",1393],["with",1357],["they",1287],["holy",1241],["spiritual",1236],["god",1198]],"vocab_skipped":null,"word_histogram":{"counts":[3406,6,66,128,151,252,217,275,279,403,454,352,333,350,162,117,61,48,21,13,11,8,7,1,1,1,0,0,0,1],"edges":[1.0,6.2,11.4,16.6,21.8,27.0,32.2,37.4,42.6,47.800000000000004,53.0,58.2,63.400000000000006,68.60000000000001,73.8,79.0,84.2,89.4,94.60000000000001,99.8,105.0,110.2,115.4,120.60000000000001,125.80000000000001,131.0,136.20000000000002,141.4,146.6,151.8,157.0]}},"kind":"text","n":7124,"n_null":0,"n_unique":3441,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.5169848399775407,"emoji_rate":0.0,"len_max":937,"len_mean":163.06948343627175,"len_median":120.0,"len_min":0,"len_p95":453.84999999999945,"n_duplicates":3683,"n_empty":3405,"one_word_rate":0.4779618192026951,"readability_flesch_mean":32.722027270283796,"url_rate":0.0,"vocab_size":9291,"word_mean":28.230207748455925,"word_median":20.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"Resources","extras":{},"kind":"unknown","n":7124,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"country_data","extras":{},"kind":"unknown","n":7124,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"language_data","extras":{},"kind":"unknown","n":7124,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","Continent.top_values","AffinityBloc.top_values","Ctry.top_values","PrimaryReligion.top_values","Population.stats","RegionName.top_values","Frontier.top_values","JPScaleText.top_values","LeastReached.top_values","PrimaryLanguageName.top_values"],"featured_charts":[{"caption":"Shows how heavily the dataset concentrates in Asia (~75%) versus other continents.","column":"Continent","kind":"donut"},{"caption":"Highlights that Islam and Hinduism together account for the majority of unreached groups.","column":"PrimaryReligion","kind":"bar"},{"caption":"Breaks the Asia bulk into sub-regions, with Asia South alone covering nearly half the rows.","column":"RegionName","kind":"bar"},{"caption":"Reveals an extreme right-skew \u2014 most groups are small (median 30k) but a few exceed 100M; consider a log scale.","column":"Population","kind":"histogram"},{"caption":"Confirms the South Asian Peoples bloc dominates and shows the next-largest cultural clusters.","column":"AffinityBloc","kind":"bar"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset is a Joshua Project catalogue of 7,124 unreached people groups described across 109 fields covering geography, language, religion, population, and outreach status. Every row is flagged as 'Unreached' (JPScaleText is constant) and 'LeastReached' is uniformly Y, so the analytical interest sits in the breakdown by region, religion, and population rather than in reach status itself. The data is heavily skewed toward Asia (5,351 of 7,124) and especially South Asian Peoples (3,681), with India alone accounting for 2,032 groups; Islam (3,279) and Hinduism (2,142) dominate PrimaryReligion. Population is extremely long-tailed (median 30,000 vs. 
max 135.5M, skew ~21), so any size-based analysis should use log scales or medians. Worth a closer look first: the Continent/Region/Country concentration, the religion mix, and the population distribution \u2014 these three together explain most of the dataset's shape.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.len_min","stats.len_max","stats.len_mean","stats.allcaps_rate","stats.one_word_rate","stats.vocab_size","stats.n_duplicates","stats.n_empty","top_words","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"PeopleID3ROG3 is almost certainly a row-level identifier for a people-group-in-country record: every one of the 7,124 rows holds a unique 7-character, all-caps, single-token code (n_unique equals n, len_min=len_max=7, allcaps_rate=1.0, one_word_rate=1.0). Sample values like '10208NG' and '10375CE' suggest a 5-digit numeric prefix (apparently PeopleID3) followed by a 2-letter suffix (apparently the ROG3 country code). There are no nulls, duplicates, or empties, so the key looks clean.","role":"identifier","scope":"column","target":"PeopleID3ROG3","treatment":"Use as a primary key for joins; exclude from modelling features."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"ROG3 holds two-letter country codes across 7,124 rows with 202 distinct values and no nulls. 
India (IN) dominates at 28.5% of records, followed by PK (767) and CH (442); the top 10 codes account for the bulk of mass while a long tail of ~190 other codes shares the remainder, giving an entropy ratio of 0.66.","role":"feature","scope":"column","target":"ROG3","treatment":"Group rare codes into an 'other' bucket before one-hot or target encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.skew","stats.kurtosis","stats.zero_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"PeopleID3 is an integer key spanning 10120 to 22661 with 4614 unique values across 7124 rows, suggesting a people-group identifier that recurs when the same group appears in more than one country (about 1.5 rows per id on average). The distribution is mildly left-skewed (-0.23) and platykurtic (-0.95) with no nulls, no zeros, and no outliers, consistent with a dense allocated id range rather than a measured quantity.","role":"foreign_key","scope":"column","target":"PeopleID3","treatment":"Treat as a join key; do not use as a numeric feature."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.std","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"ROP3 is a numeric column with 4608 unique values across 7124 rows, ranging tightly from 100005 to 119619 with a mean of 111443.68 and median of 112533. The narrow ~19k span sitting well above zero, combined with integer-looking bounds, suggests a coded identifier or sequence number rather than a measured quantity. 
Mild left skew (-0.47) and no outliers indicate a fairly uniform spread within that band, and the null rate is negligible at 0.001.","role":"identifier","scope":"column","target":"ROP3","treatment":"Treat as a categorical code or key; do not feed raw into numeric models."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","duplicate_rate","n_duplicates","len_mean","word_mean","one_word_rate","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column names a people group as it appears within a given country (e.g., 'Turk', 'Persian', 'Arab, Moroccan'), likely from a Joshua Project-style ethnographic registry. Values are short (len_mean 12.5, word_mean 1.78) with 4,722 uniques across 7,124 rows, and 33.7% are duplicates because the same people group recurs across countries \u2014 'Deaf' alone appears 151 times. Frequent qualifiers like '(Hindu traditions)' and '(Muslim traditions)' in top_words show religion-tagged variants are baked into the label.","role":"label","scope":"column","target":"PeopNameInCountry","treatment":"Treat as a categorical label; pair with country to form a unique key, and consider stripping parenthetical religion tags for cleaner grouping."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"ROG2 is a low-cardinality categorical with 7 region codes (ASI, AFR, EUR, NAR, LAM, AUS, SOP) and no nulls across 7,124 rows, consistent with a continental/region-of-origin grouping. The distribution is highly imbalanced: ASI accounts for 75.1% of records while AUS and SOP together contribute fewer than 80 rows, yielding an entropy ratio of just 0.45. 
Any model conditioned on this field will be dominated by the ASI bucket.","role":"feature","scope":"column","target":"ROG2","treatment":"One-hot encode and consider grouping AUS/SOP/LAM into an 'other' bucket given the severe imbalance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Continent is a low-cardinality geographic categorical with 7 distinct values and no nulls across 7,124 rows. The distribution is heavily concentrated: Asia alone accounts for 75.1% of records, with Africa a distant second at 986. Notably, both 'Australia' (39) and 'Oceania' (36) appear as separate categories, which is a labeling inconsistency since Australia is part of Oceania.","role":"feature","scope":"column","target":"Continent","treatment":"Reconcile Australia/Oceania into a single category, then one-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"RegionName is a categorical geographic grouping with 12 distinct regions and no nulls across 7,124 rows. The distribution is heavily concentrated: 'Asia, South' alone accounts for 47.0% of records, followed distantly by 'Asia, Southeast' at 726 and 'Asia, Northeast' at 521, leaving the Americas and Europe sparsely represented. 
Entropy ratio of 0.76 confirms meaningful but uneven coverage across the 12 buckets.","role":"feature","scope":"column","target":"RegionName","treatment":"One-hot encode and consider grouping rare regions, given the dominance of 'Asia, South'."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"ISO3 looks like a country code in standard 3-letter ISO 3166-1 alpha-3 format, with 202 distinct values across 7,124 rows and zero nulls. The distribution is heavily concentrated on India (IND) at 28.5% of rows (2,032), followed by PAK (767) and CHN (442), so South and East Asia dominate. Entropy ratio of 0.66 confirms the imbalance is material rather than uniform across countries.","role":"foreign_key","scope":"column","target":"ISO3","treatment":"Use as a join key to country reference tables; consider grouping long-tail codes or stratifying by ISO3 to control for the IND-heavy skew."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","language_counts","stats.duplicate_rate","stats.len_max","stats.len_median","stats.vocab_size","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text geographic descriptions of where a people group lives within a country, ranging from terse tags like \"Widespread.\" (56 occurrences) to multi-sentence paragraphs up to 939 characters. 64.23% of rows are null and 14.6% of the non-null values are duplicates, so usable signal is concentrated in roughly a third of the dataset. 
Content is overwhelmingly English (1714 of 1729 detected) with a long tail of place names producing a 10,936-token vocabulary across 2,176 unique strings.","role":"free_text","scope":"column","target":"LocationInCountry","treatment":"Normalize boilerplate phrases like \"Widespread\" into a categorical flag, then tokenize and embed the residual prose before modelling."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.median","stats.q1","stats.q3","stats.iqr","stats.skew","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"PeopleID1 is stored as numeric but only takes 16 distinct integer values between 10 and 26, with a tight IQR of 1.0 (Q1=20, Q3=21) around a median of 21. The distribution is heavily left-skewed (skew -1.34) and 32.9% of rows fall outside the Tukey fence, so the 'outliers' alert reflects the column being near-categorical rather than truly continuous. No nulls and no zeros, but the name suggests an identifier despite the low cardinality.","role":"feature","scope":"column","target":"PeopleID1","treatment":"Cast to categorical (16 levels) rather than treating as a continuous numeric."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"ROP1 is a low-cardinality categorical code (16 distinct values, all following an 'A0xx' pattern) with no nulls across 7,124 rows. The distribution is heavily concentrated: 'A012' alone accounts for 51.7% of records, and entropy ratio of 0.67 confirms the imbalance. 
This looks like a controlled vocabulary or lookup code rather than free input.","role":"feature","scope":"column","target":"ROP1","treatment":"One-hot or target-encode; consider grouping rare codes given the dominance of A012."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"AffinityBloc is a categorical grouping of peoples/ethnolinguistic blocs, with 16 distinct values across 7124 rows and no nulls. The distribution is heavily concentrated: 'South Asian Peoples' alone accounts for 51.7% of records (3681), followed distantly by 'Sub-Saharan Peoples' (632) and 'Arab World' (475). Entropy ratio of 0.67 confirms the imbalance, and the inclusion of 'Deaf' (151) as a bloc alongside geographic/ethnic categories is a notable taxonomy quirk.","role":"feature","scope":"column","target":"AffinityBloc","treatment":"One-hot or target-encode, and consider grouping rare blocs given the dominance of South Asian Peoples."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.kurtosis","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"PeopleID2 is a numeric identifier-like field with only 205 distinct values across 7,124 rows, ranging 101 to 475 with no nulls or zeros. The distribution is left-skewed (skew -0.50) and platykurtic (kurtosis -1.24) with median 412 well above the mean 339, suggesting a few low-id clusters pull the mean down while most rows concentrate near the upper end. 
The low cardinality relative to row count indicates this is a repeated key rather than a per-row unique id.","role":"foreign_key","scope":"column","target":"PeopleID2","treatment":"Treat as a categorical foreign key and left-join to the people dimension rather than using as a numeric feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"ROP2 is a categorical code field with 155 distinct values following an A####/C#### pattern, suggesting a classification or routing code. One value, 'A012', dominates at 51.6% of the 7,124 rows, while the remaining categories are long-tailed C-codes each below 2.4%. Entropy ratio of 0.56 confirms the distribution is heavily concentrated rather than uniform.","role":"feature","scope":"column","target":"ROP2","treatment":"Collapse rare C-codes into an 'other' bucket and one-hot or target-encode before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"PeopleCluster is a high-cardinality categorical taxonomy of ethno-religious groupings, with 205 distinct values across 7124 rows and no nulls. The distribution is dominated by South Asian categories \u2014 'South Asia Hindu - other' alone accounts for 12.2% (869 rows), followed by 'South Asia Muslim - other' (586) and 'South Asia Dalit - other' (352). 
Entropy ratio of 0.80 indicates a fairly spread distribution despite the South Asian skew, and the appearance of 'Deaf' alongside ethnolinguistic labels signals a mixed taxonomy worth flagging.","role":"feature","scope":"column","target":"PeopleCluster","treatment":"Group the long tail and target- or frequency-encode before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","duplicate_rate","n_duplicates","one_word_rate","len_mean","word_median","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds people-group / ethnolinguistic names spanning countries (e.g. 'Turk', 'Persian', 'Kurd, Kurmanji', 'Arab, Moroccan'), with frequent religious-tradition qualifiers like '(Hindu traditions)' and '(Muslim traditions)' appearing in 985 and 424 rows respectively. Values are short (mean 12.4 chars, median 2 words) and 47.5% are single-word labels, yet 35.4% (2,520 rows) are duplicates across 4,604 unique strings out of 7,124 \u2014 the same group recurs across countries. The most surprising entry is 'Deaf' at 151 occurrences, which sits oddly alongside ethnic categories.","role":"label","scope":"column","target":"PeopNameAcrossCountries","treatment":"Treat as a categorical people-group label; normalize qualifiers in parentheses and join on (group, country) for cross-country aggregation."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.median","stats.mean","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Population counts per record, ranging from 10 to 135,533,000 with a median of just 30,000. The distribution is extraordinarily right-skewed (skew 21.1, kurtosis 607) \u2014 the mean of ~502,570 sits far above Q3 of 129,000, and ~14.9% of rows flag as outliers, suggesting a mix of small localities with a few country- or megacity-scale entries. 
Null rate is negligible (0.21%) and there are no zeros.","role":"feature","scope":"column","target":"Population","treatment":"Apply a log1p transform before any modelling to tame the extreme skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Three-level categorical with values \"1\", \"2\", \"3\" and no nulls across 7124 rows. Distribution is imbalanced: \"3\" dominates at 60.3% (4299), \"1\" follows at 2330, and \"2\" is rare at 495. Entropy ratio of 0.78 confirms the skew toward the majority class.","role":"label","scope":"column","target":"Category","treatment":"Treat as a categorical label; consider class weighting or stratified sampling to handle the minority class \"2\"."},{"confidence":"high","critiques":[],"evidence_keys":["len_min","len_max","len_mean","one_word_rate","n_unique","n","duplicate_rate","top_values","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"ROL3 holds three-letter ISO 639-3 language codes \u2014 every value is exactly 3 characters and one word, with top entries like 'hin', 'ben', 'urd', 'guj', and 'tel' pointing to South Asian languages. The distribution is heavily skewed toward Hindi (662 of 7124) and only 1565 unique codes appear across 7124 rows, giving a 78% duplicate rate. 
No nulls, no empties, no formatting noise.","role":"feature","scope":"column","target":"ROL3","treatment":"treat as a categorical language code; one-hot or target-encode, and consider grouping rare codes."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.one_word_rate","stats.word_mean","stats.vocab_size","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical language label, almost always a single word (one_word_rate 0.70, word_mean 1.33) drawn from a vocabulary of 1,641 tokens across 1,563 distinct values. Hindi (662), Bengali (357), and Sindhi (191) dominate the 7,124 rows, and 78.1% of values are duplicates of an earlier row \u2014 expected for a controlled language taxonomy. Compound names like 'Pashto, Northern' and 'Punjabi, Eastern' indicate ISO-style subvariant naming rather than free text.","role":"feature","scope":"column","target":"PrimaryLanguageName","treatment":"Treat as a categorical factor; normalise the comma-separated subvariants before one-hot or target encoding."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text or controlled-vocabulary field naming a primary language dialect, with 303 distinct values across 7124 rows but populated in only 5.5% of records (null_rate 0.945). Distribution is essentially flat \u2014 entropy_ratio 0.97 and the modal value 'Punjabi' covers just 3.1% of non-nulls (12 occurrences) \u2014 so no dialect dominates. 
The mix spans South Asian, Middle Eastern, African, and European dialects, suggesting a global but extremely sparse roster.","role":"metadata","scope":"column","target":"PrimaryLanguageDialect","treatment":"Drop or collapse into a coarser language grouping; too sparse and high-cardinality to use directly as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Counts the number of languages spoken, with values ranging from 1 to 120 across 7,124 rows and no nulls. The distribution is heavily right-skewed (skew 4.87, kurtosis 36.3): the median is 1 and Q3 is 5, yet the mean is 4.33 and 597 rows (8.4%) flag as outliers, suggesting a long tail of implausibly high counts up to 120.","role":"feature","scope":"column","target":"NumberLanguagesSpoken","treatment":"Cap or log-transform before modelling, and audit the extreme tail (values up to 120) for data-entry errors."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column listing an official language per record, with 79 distinct values across 7124 rows and effectively no nulls (0.08%). Hindi dominates at 28.5% (2032 rows), followed by Urdu (767), Standard Arabic (657), Mandarin (475), and English (433), giving an entropy ratio of 0.66 \u2014 moderately concentrated rather than uniform. 
The South/Central Asian skew is notable: five of the top ten values are languages of that region, which may bias any downstream language-level analysis.","role":"feature","scope":"column","target":"OfficialLang","treatment":"Group rare languages into an 'Other' bucket and one-hot or target-encode before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","n","null_rate","kind"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'SpeakNationalLang' was skipped by the profiler, so type, cardinality and value distribution are all unavailable. The only confirmed facts are that it has 7124 rows and zero nulls. The name suggests a flag or category for whether a respondent speaks the national language, but this cannot be verified from the evidence.","role":"other","scope":"column","target":"SpeakNationalLang","treatment":"Re-profile with type inference enabled before deciding on any downstream handling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"BibleStatus is an ordinal/categorical code stored as a small integer, taking just 6 distinct values from 0 to 5 across 7,124 rows with no nulls. The distribution is heavily concentrated at the top (median 5, Q1=4, Q3=5, mean 4.05) with strong negative skew (-1.51), and 13.5% of rows flagged as low-end outliers plus a 3.8% zero rate. 
This looks like a status/level code rather than a true numeric measurement.","role":"feature","scope":"column","target":"BibleStatus","treatment":"Treat as an ordinal category (or one-hot encode) rather than a continuous numeric."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"BibleYear appears to be a publication/edition year field for Bible translations, encoded mostly as date ranges like \"1818-2022\" rather than single years. Cardinality is high (163 distinct values across 7124 rows) and the column is missing for 45.79% of rows, which is a major coverage gap. The top value \"1818-2022\" covers 17.14% of non-nulls and most frequent entries are spans, while plain single years like \"1954\" (191 occurrences) are the exception.","role":"metadata","scope":"column","target":"BibleYear","treatment":"Parse into start_year and end_year integers, then decide imputation given the 45.79% null rate."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"NTYear appears to hold year-range strings (e.g. \"1811-1998\", \"1801-1984\") indicating a span between two dates, though the presence of \"Yes\" as the third most common value (345 rows) signals encoding inconsistency. 
The column has 305 distinct values across 7124 rows with a high null rate of 24.65%, and the top value covers only 12.3% of non-nulls, so the distribution is fairly spread (entropy ratio 0.735).","role":"feature","scope":"column","target":"NTYear","treatment":"Parse year-range strings into start/end numeric fields and quarantine non-conforming values like \"Yes\" before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"PortionsYear appears to be a free-form field describing the year range covered by record portions, with 460 distinct values across 7124 rows and a 13.5% null rate. Most entries are date ranges like '1806-1962' or '1800-1980', but the single most common value is the literal string 'Yes' (821 rows, 13.3%), suggesting inconsistent data entry where a yes/no answer leaks into a date-range field. High entropy ratio (0.71) confirms values are spread across many ranges rather than concentrated.","role":"metadata","scope":"column","target":"PortionsYear","treatment":"Parse date ranges into start/end year numerics and isolate the 'Yes' contamination as a separate boolean flag before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column \"TranslationNeedQuestionable\" was skipped by the profiler, so no type, uniqueness, or value statistics are available. 
All we know is that it has 7124 rows with a 0.0 null rate; nothing else can be inferred from the evidence.","role":"other","scope":"column","target":"TranslationNeedQuestionable","treatment":"Re-profile or inspect manually before deciding on use; current evidence is insufficient."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.std","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"JPScale is a numeric column that is entirely constant: all 7124 rows hold the value 1.0 with zero nulls, zero variance, and a single unique value. It carries no information for any downstream model or comparison and was flagged as constant.","role":"metadata","scope":"column","target":"JPScale","treatment":"Drop; constant column with no variance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"JPScalePC is a 5-level categorical code (values \"1\" through \"5\") with no nulls across 7124 rows, likely an ordinal scale or rating. The distribution is heavily concentrated at \"1\" (70.2% of rows), with \"3\" the rarest at just 205 occurrences, yielding an entropy ratio of 0.59. The non-monotonic frequency order (1 > 4 > 2 > 5 > 3) is unusual for a true ordinal scale and worth checking.","role":"feature","scope":"column","target":"JPScalePC","treatment":"Treat as ordinal categorical; consider grouping minority levels (3, 5) given the dominance of \"1\"."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"JPScalePGAC is a 5-level categorical code (values \"1\" through \"5\"), likely an ordinal scale rating at the People Group Across Countries (PGAC) level, paralleling JPScalePC. 
The distribution is severely imbalanced: \"1\" accounts for 6910 of 7124 rows (top_rate 0.97), entropy_ratio is just 0.10, and the remaining four levels together hold under 220 records. No nulls are present.","role":"feature","scope":"column","target":"JPScalePGAC","treatment":"Collapse rare levels or binarise as \"1\" vs other before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column is a single-valued categorical flag holding \"Y\" for all 7124 rows, with no nulls and zero entropy. Because cardinality is 1 and top_rate is 1.0, it carries no information for any downstream model.","role":"metadata","scope":"column","target":"LeastReached","treatment":"Drop; constant column with no variance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether some 'least reached' people-group condition is met. The column is fully populated across 7124 rows with only 2 distinct values, skewed toward 'Y' at 72.3% (5152) versus 'N' at 1972. Entropy ratio of 0.85 shows the split is uneven but still informative.","role":"feature","scope":"column","target":"LeastReachedPC","treatment":"Encode as a 0/1 boolean for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"A binary Y/N flag (likely indicating whether the least-reached PGAC condition was met) with no nulls across 7124 rows. The distribution is severely imbalanced: 'Y' accounts for 6910 rows (97.0%) versus only 214 'N', yielding entropy_ratio of just 0.19. 
As a near-constant feature it carries little discriminative signal on its own.","role":"feature","scope":"column","target":"LeastReachedPGAC","treatment":"Encode as 0/1 but consider dropping or pairing with rare-class oversampling given the 97/3 imbalance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","top_values","stats.cardinality","stats.entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"GSEC is a low-cardinality categorical with 8 distinct values across 7124 rows and no nulls. The dominant value is the empty string at 51.08% (3639 rows), followed by '1' at 2767; the remaining codes ('0' through '6') together account for under 10% of rows. The mix of blanks and small integer codes suggests an optional categorical flag where 'missing' is encoded as '' rather than null.","role":"feature","scope":"column","target":"GSEC","treatment":"Recode '' as explicit missing and one-hot encode the remaining small-integer categories."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether a record has associated audio recordings. The class is heavily imbalanced toward 'Y' at 86.9% (6188 of 7124), with no nulls. Entropy ratio of 0.56 confirms the skew but the minority 'N' class still has 936 observations, enough to be usable.","role":"feature","scope":"column","target":"HasAudioRecordings","treatment":"Encode as a 0/1 boolean; watch for class imbalance if used as a target."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"NTOnline is a categorical flag with only one observed value, 'Y', across 5528 non-null rows, while 22.4% of rows are null. 
With cardinality 1 and entropy 0, it carries no discriminative signal\u2014presence vs. absence is the only information available.","role":"feature","scope":"column","target":"NTOnline","treatment":"Drop, or replace with a binary is_present indicator if the null pattern is meaningful."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","median","q1","q3","iqr","skew","outlier_rate","n_outliers","std","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"RLG3 is a discrete numeric column with only 7 unique values spanning 2 to 9, suggesting an ordinal rating or Likert-style scale rather than a continuous measurement. The distribution is tight around the median of 6 (IQR=1, Q1=5, Q3=6) with mild left skew (-0.46), but 10.6% of rows (757) fall outside the IQR fences \u2014 an artifact of the narrow box rather than true anomalies.","role":"feature","scope":"column","target":"RLG3","treatment":"Treat as an ordinal categorical; the outlier flag is a side-effect of the compressed IQR, not bad data."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","q1","q3","median","iqr","skew","outlier_rate","n_outliers","null_rate","zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"RLG3PC is an integer-coded ordinal feature with only 8 distinct values spanning 1-9 and a tight IQR of 1 (Q1=5, Q3=6). The distribution is left-skewed (-0.95) and concentrated around the median of 5, yet 14.3% of rows (1022) fall outside the IQR fence, suggesting a heavy lower tail rather than true anomalies. 
No nulls or zeros are present.","role":"feature","scope":"column","target":"RLG3PC","treatment":"Treat as an ordinal/categorical scale rather than continuous; the outlier rate reflects skew, not errors."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","median","q1","q3","iqr","mean","std","skew","kurtosis","n_outliers","outlier_rate","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"RLG3PGAC is a numeric column with only 8 distinct integer values spanning 1 to 9, suggesting an ordinal rating or Likert-style score rather than a continuous measurement. The distribution is tight around a median of 5.5 with IQR of just 1 (Q1=5, Q3=6), yet 776 rows (10.9%) fall outside the Tukey fence, indicating a heavy-tailed concentration where any deviation from the central 5-6 band registers as an outlier. Mild left skew (-0.46) hints that low scores are slightly more common than the symmetric mean of 5.27 would suggest.","role":"feature","scope":"column","target":"RLG3PGAC","treatment":"Treat as ordinal categorical; bin or one-hot encode rather than scaling as continuous."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"PrimaryReligion is a low-cardinality categorical with 7 distinct values across 7,124 rows and no nulls. Islam dominates at 46% (3,279 rows), followed by Hinduism (2,142) and Ethnic Religions (933); Non-Religious appears only 13 times and 157 rows are explicitly 'Unknown'. 
Entropy ratio of 0.68 indicates a moderately skewed but not degenerate distribution.","role":"feature","scope":"column","target":"PrimaryReligion","treatment":"One-hot encode and consider merging 'Unknown' with 'Other / Small' or treating it as a missing-value flag."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical label assigning each of 7124 rows to one of 8 primary religion categories, with no nulls. Islam dominates at 3105 rows (43.6%) followed by Hinduism at 2296, while Non-Religious (35) and Other/Small (62) are rare; entropy ratio of 0.68 indicates moderate concentration in the top two classes. 154 rows are explicitly 'Unknown', a category worth treating distinctly from missing.","role":"feature","scope":"column","target":"PrimaryReligionPC","treatment":"One-hot encode the 8 levels and keep 'Unknown' as its own category rather than imputing."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical label for the primary religion of a People Group Across Countries (PGAC) record, with 8 distinct values across 7124 rows and no nulls. Islam dominates at 45.6% (3247), followed by Hinduism (2154) and Ethnic Religions (925); Christianity is strikingly rare at just 17 rows, which is notable for a religion-coded dataset. 
Entropy ratio of 0.65 indicates moderate concentration on the top categories.","role":"feature","scope":"column","target":"PrimaryReligionPGAC","treatment":"One-hot or target-encode for modelling; consider folding 'Unknown' and 'Non-Religious'/'Christianity' tails into 'Other'."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","n_unique","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.iqr","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"RLG4 is a sparse numeric feature populated for only ~7.6% of rows (null_rate 0.9239) with just 18 distinct integer-like values ranging 10 to 39. The distribution is right-skewed (skew 1.05, mean 18.19 vs median 20.0) with 30 flagged outliers (5.5% of present values) and a tight IQR of 6. The combination of heavy nullness and a bounded, discrete value set suggests an ordinal score or category code recorded only in specific cases.","role":"feature","scope":"column","target":"RLG4","treatment":"Add a missingness indicator and impute or bin before modelling, given 92% nulls and a small discrete value set."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A sub-classification of religion (denomination/sect), with 18 distinct values like Sunni, Judaism, Sikhism, Tibetan, and Theravada. The column is 92.39% null, so it is only populated for the small subset of records where a finer-grained religious branch applies. 
Among the 7124 rows, Sunni leads at 29.52% of non-null values (160 occurrences), and entropy ratio 0.72 indicates the populated values are spread fairly evenly across branches.","role":"feature","scope":"column","target":"ReligionSubdivision","treatment":"Treat missingness as its own category and one-hot encode, or roll up into the parent Religion field before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.iqr","stats.std","stats.kurtosis","stats.skew","stats.zero_rate","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"PCIslam appears to be a percentage-style indicator of Islamic affiliation, bounded between 0 and 100 with a near-zero null rate (0.0013). The distribution is starkly bimodal rather than continuous: 47.1% of rows are exactly zero, the median is 0.28, yet Q3 sits at 99.99, producing a kurtosis of -1.93 and an IQR spanning nearly the full range. Mean (45.2) and std (48.2) confirm the mass is piled at the extremes rather than around the center.","role":"feature","scope":"column","target":"PCIslam","treatment":"Treat as bimodal: consider binarizing (0 vs >0) or binning rather than using raw value in linear models."},{"confidence":"high","critiques":[],"evidence_keys":["zero_rate","median","q1","q3","max","mean","skew","kurtosis","n_outliers","outlier_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"PCNonReligious appears to be the percentage of non-religious individuals in each record, but the distribution is dominated by zeros \u2014 87.5% of values are exactly 0 and the entire IQR collapses to 0. The remaining tail stretches to 99.0 with skew of 9.1 and kurtosis of 125.3, producing 886 outliers (12.5% of rows). 
Mean (1.02) sits far above median (0), so any modelling that assumes symmetry will be misled.","role":"feature","scope":"column","target":"PCNonReligious","treatment":"Treat as zero-inflated; consider a binary is_nonzero flag plus a log1p transform of the positive tail."},{"confidence":"high","critiques":[],"evidence_keys":["stats.zero_rate","stats.min","stats.max","stats.median","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","n_unique","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"PCUnknown is a numeric column expressing what looks like a percentage (range 0-100) of 'unknown' classification, with 92.8% of values being zero and a median/Q1/Q3 all at 0. The distribution is extremely right-skewed (skew 6.45, kurtosis 39.85) with 510 outliers (7.2%) extending up to 100. With 388 unique values and only 0.35% nulls, it carries sparse but potentially meaningful signal in the long tail.","role":"feature","scope":"column","target":"PCUnknown","treatment":"Binarize (zero vs non-zero) or log-transform the non-zero tail before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.iqr","stats.skew","stats.zero_rate","stats.outlier_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"SecurityLevel is an ordinal/categorical code stored as numeric, with only 3 distinct values spanning 0 to 2 across 7,124 complete rows. The distribution is heavily concentrated at the top tier (median, Q1, and Q3 all equal 2.0, mean 1.595), yet 15.6% of rows are 0 and the IQR-based outlier check flags 24.9% of records \u2014 an artifact of the degenerate IQR of 0 rather than true anomalies. 
Strong negative skew (-1.47) confirms the mass sits at level 2.","role":"feature","scope":"column","target":"SecurityLevel","treatment":"Treat as a 3-level ordinal category (one-hot or ordered encode); ignore the outlier flag since IQR is zero."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating membership in some 'LRTop100' set, with exactly 100 rows marked 'Y' out of 7124 \u2014 strongly suggesting a curated top-100 list. The distribution is severely imbalanced (98.6% 'N', entropy ratio 0.107), which is flagged as an imbalance alert. No nulls are present.","role":"label","scope":"column","target":"LRTop100","treatment":"Use as a binary indicator; if modelling, apply class-imbalance handling (stratification or reweighting)."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.one_word_rate","stats.len_max","stats.duplicate_rate","stats.n_empty","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"PhotoAddress holds single-token image filenames following a 'pXXXXX.jpg' pattern (one_word_rate 1.0, len_max 13). Coverage is poor: 1970 of 7124 rows are empty strings and duplicate_rate is 0.596, so the same photo is reused across many records (e.g., p19007.jpg appears 90 times). 
Only 2880 unique values back 7124 rows, suggesting shared stock images or a many-to-one photo lookup rather than a per-row asset.","role":"metadata","scope":"column","target":"PhotoAddress","treatment":"Treat as a file reference: drop from modelling, or join to an image table after handling the ~1970 empty strings."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"PhotoCredits captures the attribution string for an associated image, with 851 distinct credits across 7124 rows. The column is dominated by missing-style values: 1970 rows (27.7%) are empty strings and another 1496 are 'Anonymous', so nearly half (3466 rows, 48.7%) lack a real attribution. The remaining tail is long and idiosyncratic, mixing organisations ('Operation China, Asia Harvest'), individuals ('Isudas', 'Kerry Olson'), and platform tags ('Steve Evans - Flickr').","role":"metadata","scope":"column","target":"PhotoCredits","treatment":"Treat empty and 'Anonymous' as missing and keep only as provenance metadata; do not use as a model feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"URL string crediting the source of an associated photo, dominated by a single domain (asiaharvest.org appears 443 times) alongside a long tail of 774 distinct values. 36% of rows are null and another 43.21% of the non-null values are empty strings (about 27.7% of all rows) \u2014 together roughly 64% of rows carry no usable credit. 
Remaining values mix organisational sites (newcovenantmissions, createinternational), shorteners (tinyurl), and stock-photo hosts (pixabay, pxhere, flickr).","role":"metadata","scope":"column","target":"PhotoCreditURL","treatment":"Drop for modelling; if provenance matters, parse to domain and treat as a low-coverage attribution field."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether a photo carries a Creative Commons licence. The vast majority (top_rate 0.7981) are 'N' with only 1437 'Y' values, and nulls are negligible (null_rate 0.0007). Class imbalance is notable but not extreme.","role":"feature","scope":"column","target":"PhotoCreativeCommons","treatment":"Encode as a 0/1 boolean; impute the handful of nulls with the mode 'N'."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether a photo carries copyright restrictions, with 'N' dominating at 80.6% of 7,124 rows and only 2 unique values. Nulls are negligible (0.17%) and entropy ratio of 0.71 reflects the moderate class imbalance. No anomalies beyond the expected skew toward unrestricted photos.","role":"feature","scope":"column","target":"PhotoCopyright","treatment":"Encode as a boolean (Y=1, N=0) and impute the handful of nulls with the mode."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","top_values","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Binary opt-in flag for photo permission, stored as 'Y'/'N'. The column is heavily skewed toward 'N' at 80.4% (5715 of 7124), with a near-zero null rate of 0.2%. 
Watch the case inconsistency: 2 records use lowercase 'y' alongside 1393 uppercase 'Y', so case-sensitive joins or filters will miscount.","role":"feature","scope":"column","target":"PhotoPermission","treatment":"Normalize case (upper) and encode as boolean before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A binary flag indicating whether a profile text exists, with values Y/N. The column is severely imbalanced: 6888 of 7124 rows (96.7%) are Y, leaving only 236 N, yielding a low entropy ratio of 0.21.","role":"feature","scope":"column","target":"ProfileTextExists","treatment":"Encode as a 0/1 indicator but expect minimal predictive signal due to severe class imbalance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.outlier_rate","stats.n_outliers","stats.std"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a per-row count of distinct countries associated with each record, ranging from 1 to 164 across 7124 rows with no nulls. The distribution is severely right-skewed (skew 5.67, kurtosis 33.17): the median is just 2 and Q3 is 4, yet the mean is 8.11 and 16.98% of rows flag as outliers. A long tail of high-country records is dragging the mean far above typical values.","role":"feature","scope":"column","target":"CountOfCountries","treatment":"Log-transform or cap at a high quantile before modelling to tame the heavy right tail."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"Saturn skipped profiling on CountOfProvinces, so beyond a row count of 7124 and zero nulls, no distributional evidence is available. 
The name suggests an integer count of provinces per record, but unique count, range, and summary stats are all missing. Without further inspection the column's actual content and cardinality cannot be confirmed.","role":"other","scope":"column","target":"CountOfProvinces","treatment":"Re-profile or manually inspect this column before use; saturn skipped it."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","skew","q1","q3","n_outliers","outlier_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Geographic longitude coordinates spanning the full global range from -173.08 to 178.44 degrees. The distribution is heavily left-skewed (-1.40) with a median of 75.23 sitting well above the mean of 62.80, suggesting concentration in eastern hemisphere locations with a tail of western-hemisphere points. About 4.4% of values (316 rows) fall outside the typical IQR range.","role":"feature","scope":"column","target":"Longitude","treatment":"Pair with latitude for geospatial features; consider clustering or binning rather than treating as a raw scalar."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Latitude values for 7124 rows spanning -42.61 to 71.84 with a median of 25.02 \u2014 consistent with geographic latitudes in degrees. Distribution leans toward northern hemisphere (mean 23.54, skew -0.70) with 292 outliers (4.1%) likely representing far-southern or far-northern records. 
No nulls and 6696 unique values suggest near-record-level coordinates.","role":"feature","scope":"column","target":"Latitude","treatment":"Pair with longitude for geospatial features; avoid standard scaling alone since latitude is bounded and non-linear in distance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Country-of-origin or location field with 202 distinct values across 7,124 rows and zero nulls. India dominates at 28.5% (2,032 rows), followed by Pakistan (767) and China (442); the long tail spans 200+ countries with entropy ratio 0.66, indicating concentrated but globally distributed coverage. The South/Central Asia skew is the headline surprise \u2014 five of the top six values are Asian.","role":"feature","scope":"column","target":"Ctry","treatment":"Group rare countries into an 'Other' bucket or encode by region before modelling to avoid 200-way one-hot blow-up."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A binary Y/N flag indicating Indigenous status, fully populated across all 7124 rows. 
The distribution is imbalanced: 'Y' accounts for 79.4% (5657 rows) versus 1467 'N' rows, which is a notable skew to keep in mind for any stratified analysis.","role":"feature","scope":"column","target":"IndigenousCode","treatment":"Encode as a binary indicator and watch for class imbalance when used as a predictor or stratifier."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"PercentAdherents appears to be a numeric measure (likely a percentage or rate of religious adherents) stored as strings, with 692 distinct values across 7,124 rows and no nulls. It is dominated by '0.000', which accounts for 56.2% of records, and the long tail of small integer- and decimal-valued strings drives entropy down to a ratio of 0.43. The format mixing whole numbers like '5.000' with fractions like '0.200' suggests these are raw values rather than binned categories.","role":"feature","scope":"column","target":"PercentAdherents","treatment":"Cast to float and treat as a zero-inflated numeric feature rather than a category."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Stored as a categorical but the 184 distinct values are numeric strings ranging from '0.000' to figures like '8.571', suggesting this is a percent-Christian metric (likely per-capita or per-county) cast as text. The distribution is concentrated: '0.482' alone covers 12.2% of 7124 rows and the top 10 values account for a large share, yet entropy ratio of 0.79 indicates the long tail still carries information. 
No nulls, but the repeated exact decimals hint at a lookup or pre-binned source rather than raw measurements.","role":"feature","scope":"column","target":"PercentChristianPC","treatment":"Cast to float and treat as a continuous feature; investigate the heavy spike at 0.482 before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_duplicates","stats.one_word_rate","stats.len_mean","stats.word_mean","stats.word_median","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Short ethnonym/community labels (e.g., 'Deaf', 'Turk', 'Persian', 'Japanese'), averaging 11.8 characters and 1.7 words with a median of 2 words. About 34% of rows are duplicates (2,419) and ~49% are single-word entries, with 4,705 unique values across 7,124 rows. Surprising signals: 'Deaf' tops the list at 151 occurrences, and top words include parenthetical religious qualifiers like 'traditions)', '(hindu', '(muslim' (952/477/411), suggesting many entries carry trailing tradition tags that the tokenizer split awkwardly.","role":"label","scope":"column","target":"NaturalName","treatment":"Normalize casing and strip parenthetical tradition suffixes, then treat as a categorical label."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.one_word_rate","stats.word_mean","stats.len_mean","stats.duplicate_rate","stats.n_duplicates","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Phonetic respellings of ethnonyms \u2014 short hyphenated pronunciation guides like 'PUR-zhun', 'jae-puh-NEEZ', and 'pahsh-TOON' \u2014 accompanying some other label column. Values are overwhelmingly single tokens (one_word_rate 0.73, word_mean 1.28, len_mean 10.8) and 48.5% are null, so coverage is partial. 
Duplicates dominate (n_duplicates 2183, duplicate_rate 0.59) with only 1489 unique forms across 7124 rows, suggesting a small controlled vocabulary repeated across records.","role":"metadata","scope":"column","target":"NaturalPronunciation","treatment":"Treat as an optional pronunciation lookup keyed to the parent term; drop or impute before modelling given ~48% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","stats.cardinality","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a percentage or count of Christians (PGAC suggesting a per-group/area Christian metric), stored as strings with three-decimal precision rather than as a numeric type. It is heavily zero-inflated: '0.000' accounts for 43.8% of the 7,124 rows (3,121 occurrences), and a suspiciously specific value '3.733' is the second mode at 151 rows. With 842 distinct values and entropy ratio 0.58, the distribution is concentrated but long-tailed, and the null rate is negligible at 0.07%.","role":"feature","scope":"column","target":"PercentChristianPGAC","treatment":"Cast to numeric and consider a zero-inflated transform (e.g., log1p with a zero indicator) before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"PercentEvangelical reads as a numeric share of evangelicals stored as strings, with 401 distinct values across 7124 rows. The distribution is heavily zero-inflated: 65.7% of rows are exactly \"0.000\" and another 10.4% are null, leaving a long tail of small fractions like 0.100, 0.200, 0.500. 
Entropy ratio of 0.364 confirms most of the signal collapses onto that single zero bucket.","role":"feature","scope":"column","target":"PercentEvangelical","treatment":"Cast to float, impute the 10.4% nulls, and consider a zero-vs-nonzero indicator alongside the raw value to handle the zero inflation."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"PercentEvangelicalPC appears to be a numeric percentage (likely an evangelical population share, possibly per capita or principal-component scaled) that has been stored as strings, yielding 166 distinct values across 7124 rows with a 2.15% null rate. The distribution is concentrated: the top value '0.199' covers 12.47% of rows, and the leading entries cluster near zero ('0.095', '0.000', '0.004') yet some values reach above 3 ('3.409', '3.339'), suggesting a long right tail or mixed scale. Entropy ratio of 0.78 indicates moderate concentration rather than uniformity.","role":"feature","scope":"column","target":"PercentEvangelicalPC","treatment":"Cast to float, impute the ~2% nulls, and consider log or rank transform given the right-tailed values."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric percentages (likely share of evangelical population per PGAC unit) stored as strings, hence profiled as categorical with 548 distinct values. The distribution is heavily zero-inflated: '0.000' accounts for 48.9% of 7124 rows, with a curious secondary spike at '1.801' (151 rows) that doesn't fit a percentage interpretation cleanly. 
Null rate is 6.32% and entropy ratio is 0.55, consistent with a long tail of small fractional values.","role":"feature","scope":"column","target":"PercentEvangelicalPGAC","treatment":"Cast to float, impute or flag nulls, and consider a zero-indicator plus log/sqrt transform given the heavy zero mass."},{"confidence":"high","critiques":[],"evidence_keys":["stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.iqr","stats.zero_rate","stats.outlier_rate","stats.skew","stats.kurtosis","stats.std","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"PCBuddhism appears to be a percentage feature measuring the Buddhist share of some unit (likely a postcode or area), ranging 0 to 100 with mean 6.41. The distribution is extremely zero-inflated: 82.99% of rows are exactly 0, the entire IQR collapses to 0, and yet 17.01% of rows are flagged as outliers with skew 3.48 and kurtosis 10.56. This means Buddhism is rare across most areas but reaches sizeable concentrations in a long tail.","role":"feature","scope":"column","target":"PCBuddhism","treatment":"Treat as zero-inflated proportion: add a presence indicator and log1p-transform the non-zero tail before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.std","stats.q1","stats.q3","stats.iqr","stats.skew","stats.kurtosis","stats.zero_rate","stats.outlier_rate","stats.n_outliers","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"PCEthnicReligions is a numeric percentage-style feature (0\u2013100) capturing the share of some ethnic-religion category, likely per record/region. It's overwhelmingly zero \u2014 78% of values are 0 and the entire interquartile range collapses to 0 \u2014 yet the mean is 13.1 with std 30.7, indicating a small set of records carry very large shares. 
Skew of 2.16 and a 22% outlier rate confirm a sparse, heavy-tailed distribution rather than a smooth continuum.","role":"feature","scope":"column","target":"PCEthnicReligions","treatment":"Binarize (zero vs non-zero) or apply a zero-inflated/log1p transform before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","q1","q3","zero_rate","skew","kurtosis","n_unique","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be the percentage share of Hindus in some geographic or demographic unit, ranging from 0 to 100 with a mean of 29.8. The distribution is strongly bimodal in spirit: 67.7% of rows are exactly zero while Q3 sits at 98.4, indicating most units have no Hindu presence and a substantial minority are nearly entirely Hindu. Skew is 0.87 and kurtosis -1.22, consistent with this U-shaped split rather than a single peak.","role":"feature","scope":"column","target":"PCHinduism","treatment":"Consider a zero-vs-nonzero indicator plus the raw percentage, since a flat numeric treatment will hide the bimodal structure."},{"confidence":"high","critiques":[],"evidence_keys":["zero_rate","q1","q3","iqr","max","mean","std","skew","kurtosis","n_outliers","outlier_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"PCOtherSmall is a numeric feature where 88% of rows are zero and the IQR is zero, meaning the bottom three quartiles are all 0. The remaining mass stretches up to 100 with mean 1.84 and std 12.33, producing severe right skew (7.39) and very heavy tails (kurtosis 54.18). 
About 12% of rows (851) flag as outliers, suggesting this is a sparse share/percentage indicator that fires only for a small subset of records.","role":"feature","scope":"column","target":"PCOtherSmall","treatment":"Binarize presence (>0) or apply log1p before modelling to tame the skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.median","stats.iqr","stats.skew","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"RegionCode holds 12 distinct integer values from 1 to 12 with no nulls, so it is almost certainly a categorical region identifier stored as a number rather than a true numeric measure. The distribution is concentrated around the median of 4 with an IQR of just 2, yet the right skew of 1.12 and 601 flagged outliers (8.4%) reflect the long tail of higher-numbered regions rather than genuine anomalies.","role":"feature","scope":"column","target":"RegionCode","treatment":"Cast to categorical and one-hot or target-encode; do not treat as a continuous numeric."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.outlier_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"PopulationPGAC appears to be a population count tied to some geographic or administrative unit (PGAC), spanning 10 to roughly 925 million across 7,124 rows with only 0.07% nulls. The distribution is extraordinarily right-skewed (skew 25.5, kurtosis 1051) \u2014 the median is 130,300 while the mean is 4.88 million, and 17.8% of rows flag as outliers. 
With 1,509 unique values across 7,124 rows, the same population figures repeat heavily, suggesting many rows share the same geographic aggregate.","role":"feature","scope":"column","target":"PopulationPGAC","treatment":"Log-transform before regression to tame the extreme right skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether a record is on the frontier, with no nulls across 7124 rows. The split is imbalanced toward Y at 66.9% (4767) versus N at 2357, though entropy ratio of 0.92 shows both classes are well represented.","role":"feature","scope":"column","target":"Frontier","treatment":"Encode as a 0/1 indicator before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.one_word_rate","stats.len_max","stats.duplicate_rate","stats.n_empty","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"MapAddress holds single-token PNG filenames (e.g. 'm00328.png'), with one_word_rate of 1.0 and max length 13, suggesting it points to a map image asset. 1500 of 7124 rows are empty strings and duplicate_rate is 0.352, but most of those duplicates are the repeated empty string: only about 18% of non-empty rows repeat an earlier filename \u2014 still meaning many records share the same map. 
With 4616 unique values across 7124 rows, this behaves like a foreign reference to a finite set of map images rather than a free-text field.","role":"foreign_key","scope":"column","target":"MapAddress","treatment":"Treat as a categorical asset reference: impute or flag the 1500 empties and join to a map-image lookup."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether the Jesus Film is available for the entity (likely a language or people group). Heavily skewed toward 'Y' at 78.7% (5,610 of 7,124), with no nulls across all 7,124 rows. Entropy of 0.746 reflects the imbalance but still leaves a usable minority class of 1,514 'N' values.","role":"feature","scope":"column","target":"HasJesusFilm","treatment":"Encode as 0/1 boolean; account for class imbalance if used as a target."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating nomadic status, with no nulls across 7124 rows. Severely imbalanced: 'N' dominates at 96.6% (6884 rows) versus only 240 'Y' cases, yielding a low entropy ratio of 0.21.","role":"feature","scope":"column","target":"Nomadic","treatment":"Encode as binary; consider class-weighting or stratified sampling due to severe imbalance."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"This is a low-cardinality categorical describing the type of nomadic livelihood, with only 6 distinct values dominated by 'Agro-Pastoralists' (76.7% of non-nulls, 184 records). 
The column is almost entirely empty \u2014 null_rate is 0.9663, leaving roughly 240 populated rows out of 7124. Several values are comma-joined combinations (e.g., 'Agro-Pastoralists, Service or Trade'), suggesting the field encodes multi-label memberships as concatenated strings.","role":"feature","scope":"column","target":"NomadicTypeDescription","treatment":"Split comma-separated values into multi-hot indicators and treat missingness as its own category given the 96.6% null rate."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Creative Commons license version attached to a photo (e.g., 'CC BY 2.0', 'CC BY-SA 4.0'). The field is dominated by empty strings at 79.8% of 7124 rows, with only 16 distinct values and entropy ratio 0.33, so license metadata is missing for the vast majority of records. Among populated values, 'CC BY 2.0' (387) and 'CC BY-SA 4.0' (246) lead.","role":"metadata","scope":"column","target":"PhotoCCVersionText","treatment":"Treat empty string as missing and group rare licenses; use as a low-cardinality categorical only where photo licensing matters."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds the URL of the Creative Commons license version applied to an associated photo, drawn from a fixed set of 16 distinct license URIs. About 79.8% of rows (5688 of 7124) are empty strings, so the field is sparsely populated; among the populated minority, CC BY 2.0 (387) and CC BY-SA 4.0 (246) dominate. 
Entropy ratio of 0.33 confirms heavy concentration on the blank value.","role":"metadata","scope":"column","target":"PhotoCCVersionURL","treatment":"Treat empty strings as missing and collapse to a categorical license code before any modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Attribution string crediting the data, geography, and design sources for each map (e.g. Joshua Project, GMI, UNESCO, IMB). With 161 distinct values across 7124 rows, the top credit covers 28% of records and a blank string is the second most common value at 1505 rows; near-duplicates differing only by trailing punctuation (the same Omid/UNESCO credit appears with and without a final period) inflate cardinality.","role":"metadata","scope":"column","target":"MapCredits","treatment":"Normalise whitespace/punctuation to collapse near-duplicates, then drop from modelling as boilerplate provenance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds attribution URLs for source maps, but 6919 of 7124 rows (top_rate 0.9712) are empty strings, leaving only 31 distinct values across the entire dataset. Among the populated entries, cartomission.com dominates with 100 occurrences while most other domains appear fewer than 10 times, producing a very long tail. 
Entropy ratio of 0.054 confirms there is almost no information here unless the empty string itself is treated as a meaningful 'no credit' signal.","role":"metadata","scope":"column","target":"MapCreditURL","treatment":"Keep as provenance metadata; do not use as a model feature given 97% blanks."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A near-binary flag (N/Y) with a third state being an empty string, almost certainly indicating whether map copyright applies. 'N' dominates at 72.95% (5197/7124), blanks account for 1885 rows, and only 42 records are 'Y' \u2014 a severe class imbalance that makes the affirmative case nearly negligible.","role":"feature","scope":"column","target":"MapCopyright","treatment":"Normalize blanks to a missing/'N' category and treat as a low-signal binary flag given the 42-row positive class."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Creative Commons license version field for maps, but it is effectively empty: 7114 of 7124 rows (top_rate 0.9986) carry the blank string, leaving only 10 rows with actual licenses split across CC BY-SA 3.0 (8), CC0 1.0 (1), and CC BY 3.0 (1). 
Entropy is just 0.0166 (entropy_ratio 0.0083), so the column carries almost no information despite having 0% nulls \u2014 the missingness is encoded as empty strings rather than NaN.","role":"metadata","scope":"column","target":"MapCCVersionText","treatment":"Drop; near-constant blank with only 10 informative rows."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"MapCCVersionURL appears to hold a Creative Commons license URL associated with each map record, but it is essentially empty: 7114 of 7124 rows (top_rate 0.9986) carry the blank string, leaving just 10 rows split across three CC license URLs. Entropy is 0.017 (ratio 0.008), so the column carries almost no information despite having 4 distinct values and zero nulls (the missingness is encoded as \"\" rather than null).","role":"metadata","scope":"column","target":"MapCCVersionURL","treatment":"Drop; near-constant with empty-string standing in for missing."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"JF is a binary Y/N flag with no nulls across 7124 rows. The distribution is imbalanced: \"Y\" accounts for 78.7% (5610 rows) versus 1514 \"N\", giving an entropy ratio of 0.746. 
The column name is opaque on its own, but the counts match HasJesusFilm exactly (5610 'Y' vs 1514 'N'), so JF is most likely a redundant copy of that Jesus Film flag; confirm before dropping either.","role":"feature","scope":"column","target":"JF","treatment":"Encode as a 0/1 indicator; consider class imbalance if used as a target."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Binary Y/N flag indicating whether audio recordings exist for each row, with no nulls across 7124 records. The distribution is heavily imbalanced toward 'Y' at 86.9% (6188 vs 936), giving an entropy ratio of 0.56.","role":"feature","scope":"column","target":"AudioRecordings","treatment":"Encode as a 0/1 indicator; be mindful of class imbalance if used as a target."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Window1040 is a binary Y/N flag covering all 7124 rows with no nulls. The distribution is imbalanced: 'Y' accounts for 5910 rows (top_rate 0.8296) versus 1214 'N', giving an entropy ratio of 0.659. The column's semantic meaning isn't recoverable from the evidence, but it behaves like a clean indicator variable.","role":"feature","scope":"column","target":"Window1040","treatment":"Encode as a 0/1 indicator and watch for class imbalance when used as a predictor."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.url_rate","stats.one_word_rate","stats.duplicate_rate","stats.n_duplicates","stats.n_empty","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds URLs to people-group map images hosted on joshuaproject.net, with every non-empty value being a single token (one_word_rate 1.0, url_rate 0.79). 
1,500 of 7,124 rows are empty strings and 2,508 are duplicates (duplicate_rate 0.35), meaning many people groups share the same map image (e.g., m00328.png appears 40 times). With 4,616 unique values across 7,124 rows, this is a reference link rather than a unique key.","role":"metadata","scope":"column","target":"PeopleGroupMapURL","treatment":"Keep as a display/reference URL; drop from modelling features."},{"confidence":"high","critiques":[],"evidence_keys":["url_rate","n_empty","n_duplicates","duplicate_rate","one_word_rate","top_values","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds URLs to expanded people-group map PDFs hosted on joshuaproject.net, with 72.3% of rows containing a URL and every value being a single token. 1,975 rows (about 27.7%) are empty strings, and 2,793 rows (39.2%) duplicate another value \u2014 e.g. m00328.pdf appears 40 times \u2014 suggesting many people groups share the same regional map.","role":"metadata","scope":"column","target":"PeopleGroupMapExpandedURL","treatment":"Treat as a reference link; drop from modelling or extract the map ID if joining to a maps table."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.len_min","stats.len_max","stats.url_rate","stats.one_word_rate","stats.duplicate_rate","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Joshua Project people-group URLs, one per row, with every value a 48-character single-token https link (url_rate 1.0, one_word_rate 1.0, len_min and len_max both 48). All 7124 values are unique with zero nulls or duplicates, so it functions as a per-row identifier rather than a feature. 
The URLs encode a people-group ID and a country code suffix (e.g., /10375/tz, /10375/up), meaning the same group recurs across countries in the underlying key even though the full URL is unique.","role":"identifier","scope":"column","target":"PeopleGroupURL","treatment":"Drop from modelling; retain as a row-level link key or parse out the people-group ID and country code as separate features."},{"confidence":"high","critiques":[],"evidence_keys":["stats.url_rate","stats.one_word_rate","stats.duplicate_rate","stats.n_empty","n","n_unique","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Joshua Project people-group photo URLs, with every populated cell being a single joshuaproject.net/assets/media/profiles/photos/.jpg link (url_rate 0.72, one_word_rate 1.0). 1971 of 7124 rows are empty strings (no nulls reported), and the same image URLs repeat heavily \u2014 duplicate_rate is 0.60 with only 2880 unique values, the top URL appearing 90 times. The same photo is clearly being reused across many people-group records rather than being a unique per-row asset.","role":"metadata","scope":"column","target":"PeopleGroupPhotoURL","treatment":"Treat as an optional asset link; drop or replace empty strings with null and do not use as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Country-level URLs pointing to joshuaproject.net profile pages, with the 2-letter country code as the path segment. There are 202 distinct countries across 7,124 rows and no nulls, but the distribution is heavily concentrated: India alone accounts for 28.5% of rows (2,032), with Pakistan (767) a distant second. 
Entropy ratio of 0.66 confirms moderate skew toward a handful of South Asian countries.","role":"foreign_key","scope":"column","target":"CountryURL","treatment":"Extract the trailing country code as a categorical key; treat the URL itself as redundant metadata."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"JPScaleText is a categorical field that holds a single value, \"Unreached\", across all 7124 rows with no nulls. With cardinality of 1 and entropy of 0, it carries no information and cannot discriminate between records. The constant value suggests this dataset has been pre-filtered to unreached people groups only.","role":"metadata","scope":"column","target":"JPScaleText","treatment":"Drop; constant column with zero entropy."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Every one of the 7,124 rows holds the same URL, https://joshuaproject.net/assets/img/gauge/gauge-1.png, giving a single unique value and zero entropy. This looks like a static asset link (a JP Scale gauge image) attached to each record rather than a discriminating feature. 
It carries no information for analysis or modelling.","role":"metadata","scope":"column","target":"JPScaleImageURL","treatment":"Drop; constant column with a single value across all rows."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_duplicates","stats.n_empty","stats.one_word_rate","stats.len_mean","stats.len_median","stats.word_mean","stats.readability_flesch_mean","language_counts","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text English summaries describing South Asian people groups (Rajputs, Jats, Bania, Beldar, etc.), averaging 51 words with median length 316 characters. Quality is poor: 3,167 of 7,124 rows (44%) are empty strings and another 3,439 are duplicates, leaving only 3,685 unique values and a 48% duplicate rate. Several near-identical Rajput paragraphs differ by only a word or two, suggesting lightly edited copies of the same source text rather than independent summaries. Flesch readability of 30.4 indicates fairly difficult prose.","role":"free_text","scope":"column","target":"Summary","treatment":"Deduplicate near-identical entries and drop or impute the 3,167 empty rows before tokenizing and embedding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_duplicates","stats.n_empty","stats.one_word_rate","stats.len_mean","stats.word_mean","stats.readability_flesch_mean","stats.vocab_size","top_values","language_counts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text English prose describing barriers to Christian evangelism among various people groups (Rajputs, Jats, Bosniaks, Azeri, etc.), averaging 18 words and 107 characters per entry. Notably, 3167 of 7124 rows are empty strings and the duplicate rate is 0.489, with a single Rajput-pride passage repeated 88 times and a near-identical Jat passage appearing as both 74- and 7-count variants. 
Readability is low (Flesch 31.6) and vocabulary is modest (9760 unique words), consistent with a templated missiological description field.","role":"free_text","scope":"column","target":"Obstacles","treatment":"Treat empties as missing, dedupe near-identical passages, then tokenize and embed for downstream topic or similarity analysis."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_duplicates","stats.n_empty","stats.len_median","stats.word_median","stats.len_mean","stats.len_p95","stats.readability_flesch_mean","stats.vocab_size","top_values","language_counts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text English prose describing outreach/engagement strategies for various people groups, likely a 'how to reach' field in a missions dataset. Over half the rows (3883 of 7124) are empty strings and duplicate_rate is 0.60, with the same Jats and Rajputs paragraphs repeating dozens of times \u2014 so the median length and word count are 0. Readability is low (Flesch 27.3) and vocabulary reaches 7803 tokens across the non-empty rows.","role":"free_text","scope":"column","target":"HowReach","treatment":"Treat empty strings as missing, deduplicate boilerplate, then tokenize and embed for downstream NLP."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","language_counts","stats.duplicate_rate","stats.n_empty","stats.one_word_rate","stats.len_max","stats.len_mean","stats.readability_flesch_mean","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text prayer prompts for an unreached-people-group / church-planting dataset, written in English (1473 detected) and centered on words like 'pray', 'Christ', 'among'. The field is sparsely populated: 5032 of 7124 rows are empty and only 1713 unique strings exist, giving a 0.76 duplicate rate as the same boilerplate prayer is reused across people groups (top non-empty value repeats 146 times). 
Readability is low (Flesch 19.5) and length varies wildly from 0 to 649 chars, so the column is a mix of nothing, one-liners, and full paragraphs.","role":"free_text","scope":"column","target":"PrayForChurch","treatment":"Treat as optional long-form text: impute empties as missing and tokenize/embed the rest before any modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_duplicates","stats.n_empty","stats.len_mean","stats.len_max","stats.readability_flesch_mean","language_counts","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text prayer points for people groups (PG), each entry a short paragraph of intercessions led by the verb 'pray' (5450 occurrences). Nearly half the rows are empty (3405 of 7124) and another large chunk reuse boilerplate templates \u2014 duplicate_rate 0.517 with the top non-empty value repeating 88 times \u2014 so unique content is far less than the 3441 distinct strings suggest. Readability is low (Flesch mean 32.7) and all detected language is English (2528 rows tagged en).","role":"free_text","scope":"column","target":"PrayForPG","treatment":"Treat as free-text: drop empties, dedupe boilerplate, then tokenize/embed if used as a feature."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column is named \"Resources\" with 7124 rows and zero nulls, but saturn skipped profiling so the kind is unknown and no unique count or value statistics were computed. 
Without type inference or sample values, its content (numeric, list, text, or identifier) cannot be determined from the evidence.","role":"other","scope":"column","target":"Resources","treatment":"Re-profile or inspect raw samples to establish type before any downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `country_data` was skipped by the profiler, so its kind is unrecorded and no statistics, uniqueness, or value distribution are available. The only confirmed signals are 7124 rows with a 0.0 null rate. Without further inspection, the contents (likely some country-related payload given the name) cannot be characterised.","role":"other","scope":"column","target":"country_data","treatment":"Re-profile or manually inspect this column before any downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `language_data` was skipped by the profiler \u2014 its kind is unrecognised and no descriptive statistics, uniqueness count, or value samples were emitted. Only the row count (7124) and a null rate of 0.0 are available, so nothing can be said about content, cardinality, or distribution. 
The name hints at linguistic payloads (possibly nested or serialised), but this is not corroborated by evidence.","role":"other","scope":"column","target":"language_data","treatment":"Re-profile after parsing or casting to a supported type before deciding on use."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":31095,"prompt_tokens":141672,"total_tokens":172767}},"language_counts":{"ceb":1,"de":4,"en":11903,"eo":2,"es":1,"id":1,"ilo":1,"it":2,"min":1,"pt":2},"meta":{"generated_at":"2026-05-01T18:35:56+00:00","mode":"full","row_count":7124,"sampled_rows":7124,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/joshua-project/joshua_project_unreached.parquet"},"notes":[],"saturn_version":"0.2.0","schema":{"AffinityBloc":"categorical","AudioRecordings":"categorical","BibleStatus":"numeric","BibleYear":"categorical","Category":"categorical","Continent":"categorical","CountOfCountries":"numeric","CountOfProvinces":"unknown","CountryURL":"categorical","Ctry":"categorical","Frontier":"categorical","GSEC":"categorical","HasAudioRecordings":"categorical","HasJesusFilm":"categorical","HowReach":"text","ISO3":"categorical","IndigenousCode":"categorical","JF":"categorical","JPScale":"numeric","JPScaleImageURL":"categorical","JPScalePC":"categorical","JPScalePGAC":"categorical","JPScaleText":"categorical","LRTop100":"categorical","Latitude":"numeric","LeastReached":"categorical","LeastReachedPC":"categorical","LeastReachedPGAC":"categorical","LocationInCountry":"text","Longitude":"numeric","MapAddress":"text","MapCCVersionText":"categorical","MapCCVersionURL":"categorical","MapCopyright":"categorical","MapCreditURL":"categorical","MapCredits":"categorical","NTOnline":"categorical","NTYear":"categorical","NaturalName":"text","NaturalPronunciation":"text","Nomadic":"categorical","NomadicTypeDescription":"categorical","NumberLanguagesSpoken":"numeric","Obstacles":"text","OfficialLang":"categorical","PCBuddhism":"numeric","PCEthnicReligions":"nu
meric","PCHinduism":"numeric","PCIslam":"numeric","PCNonReligious":"numeric","PCOtherSmall":"numeric","PCUnknown":"numeric","PeopNameAcrossCountries":"text","PeopNameInCountry":"text","PeopleCluster":"categorical","PeopleGroupMapExpandedURL":"text","PeopleGroupMapURL":"text","PeopleGroupPhotoURL":"text","PeopleGroupURL":"text","PeopleID1":"numeric","PeopleID2":"numeric","PeopleID3":"numeric","PeopleID3ROG3":"text","PercentAdherents":"categorical","PercentChristianPC":"categorical","PercentChristianPGAC":"categorical","PercentEvangelical":"categorical","PercentEvangelicalPC":"categorical","PercentEvangelicalPGAC":"categorical","PhotoAddress":"text","PhotoCCVersionText":"categorical","PhotoCCVersionURL":"categorical","PhotoCopyright":"categorical","PhotoCreativeCommons":"categorical","PhotoCreditURL":"categorical","PhotoCredits":"categorical","PhotoPermission":"categorical","Population":"numeric","PopulationPGAC":"numeric","PortionsYear":"categorical","PrayForChurch":"text","PrayForPG":"text","PrimaryLanguageDialect":"categorical","PrimaryLanguageName":"text","PrimaryReligion":"categorical","PrimaryReligionPC":"categorical","PrimaryReligionPGAC":"categorical","ProfileTextExists":"categorical","RLG3":"numeric","RLG3PC":"numeric","RLG3PGAC":"numeric","RLG4":"numeric","ROG2":"categorical","ROG3":"categorical","ROL3":"text","ROP1":"categorical","ROP2":"categorical","ROP3":"numeric","RegionCode":"numeric","RegionName":"categorical","ReligionSubdivision":"categorical","Resources":"unknown","SecurityLevel":"numeric","SpeakNationalLang":"unknown","Summary":"text","TranslationNeedQuestionable":"unknown","Window1040":"categorical","country_data":"unknown","language_data":"unknown"}}
