{"columns":[{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"}],"column":"_id","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8139,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[23.5,23.525,23.55,23.575,23.6,23.625,23.65,23.675,23.7,23.725,23.75,23.775,23.8,23.825,23.85,23.875,23.9,23.925,23.95,23.975,24.0,24.025,24.05,24.075,24.1,24.125,24.15,24.175,24.2,24.225,24.25,24.275,24.3,24.325,24.35,24.375,24.4,24.425,24.45,24.475,24.5]},"near_unique":true,"sample":["5fc4172fc6cd28ebd99dd0f5","61b6434e0109cc2a5dcc5bd7","61eb3a497153a097cfec9ef7","61d3a1cc0109cc2a5d8091ae","5fce98661b4f187382e1067e","622ba824a936b9560071aede","5fce98691b4f187382e108e0","61ffe8d4d80f14ddc2373e83","61d4fcbc0109cc2a5d118c21","5fc419791ebf67b9fbe4b919","61418f1c73f719004f2af9f1","6088127328f29d0115de36a2","5fc41a0d1ebf67b9fbe50464","5fc4172ec6cd28ebd99dd0f2","5fc41a131ebf67b9fbe50850","5fc419d61ebf67b9fbe4e66c","5fc419a21ebf67b9fbe4cb66","61dc89550109cc2a5dd4d249","6239521aa936b9560081fa87","5fce98621b4f187382e10383","5fc41a281ebf67b9fbe512d9","5fc419751ebf67b9fbe4b75a","5fc419bd1ebf67b9fbe4da2f","5fc4199b1ebf67b9fbe4c827","6197122cdc71c3764eccf431","61b6435b0109cc2a5dcc6284","60ede62a1e8b306b92d7402a","5fc419da1ebf67b9fbe4e8aa","5fc419a21ebf67b9fbe4cb33","622c6be5a936b956009b9c16","616f56e9b2ba10846638eeaa","62395249a936b95600820ccf","6175119cb2ba1084666931e2","5fce985f1b4f187382e1027c","5fce98571b4f187382e0ffe4","5fce98691b4f187382e10850","6212a949d80f14ddc202f177","6088120a28f29d0115de2fac","5fce986b1b4f187382e10973","6088126b28f29d0115de361e","61d055720109cc2a5df9f298","6209975fd80f14ddc2979b24","5fc41a051ebf67b9fbe50043","6209428cd80f14ddc2864838","6222238fdc2980b9632c814f","6230cb13a936b9560081d28c","5fc41a3a1ebf67b9fbe51a17","5fce985f1b4f187382e10288","5fc419b51ebf67b9fbe4d621","61f8523e642b77b2dffcc213"],"top_values":[],"top_words":[["5fc4172ec6cd28ebd99dd0e2",1],["5fc4172ec6cd28ebd99dd0ea",1],["5fc4172ec6cd28ebd99dd0ed",1],["5fc4172ec6cd28ebd99dd0ee",1],["5fc419171ebf67b9fbe48615",1],["5fc4172ec6cd28ebd99dd0ef",1],["5fc4172ec6cd28ebd99dd0e8",1],["5fc419171ebf67b9fbe485a2",1],["5fc4172ec6cd28ebd99dd0f1",1],["5fc4172fc6cd28ebd99dd0f5",1],["5fc419171ebf67b9fbe485b2",1],["5fc419171ebf67b9fbe485c3",1],["5fc419171ebf67b9fbe48636",1],["5fc4172ec6cd28ebd99dd0ec",1],["5fc419161ebf67b9fbe48571",1],["5fc419161ebf67b9fbe4858a",1],["5fc419171ebf67b9fbe485aa",1],["5fc419171ebf67b9fbe4863e",1],["5fc419171ebf67b9fbe48648",1],["5fc419181ebf67b9fbe4869f",1],["5fc419181ebf67b9fbe486a7",1],["5fc4172ec6cd28ebd99dd0e4",1],["5fc4172ec6cd28ebd99dd0e3",1],["5fc4172ec6cd28ebd99dd0e9",1],["5fc4172ec6cd28ebd99dd0f0",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8139,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":8139,"n_null":0,"n_unique":8139,"null_rate":0.0,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":24,"len_mean":24.0,"len_median":24.0,"len_min":24,"len_p95":24.0,"n_duplicates":0,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":31.967000000000034,"url_rate":0.0,"vocab_size":8139,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"one_word","level":"warn","message":"59.8% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"}],"column":"display_name","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[329,1711,1902,1037,1236,1354,275,167,39,27,31,4,14,2,2,2,0,1,1,1,1,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,3.4,5.8,8.2,10.6,13.0,15.399999999999999,17.8,20.2,22.599999999999998,25.0,27.4,29.799999999999997,32.2,34.6,37.0,39.4,41.8,44.199999999999996,46.6,49.0,51.4,53.8,56.199999999999996,58.599999999999994,61.0,63.4,65.8,68.2,70.6,73.0,75.39999999999999,77.8,80.2,82.6,85.0,87.39999999999999,89.8,92.2,94.6,97.0]},"near_unique":false,"sample":["sree","josh","null","dcabatin","Markella","ThanosVav","Josh Barton","erika","ciarrariley","Sascha Nolte","Ferras","Steve Erickson","Bryan Colley","Sally Jane Black","Steven Clarke","Ryan Oliver","chris\ud83e\udec0","Skrana","hsblechman","isabel","Driver","Katie \u2744\ufe0f","Gillian Kaney","sophie b","null","David Block","Sid V \ud83c\udf2a\ufe0f","rcjohnso","Forrest Cardamenis","omar","firas18","Jack Knightley","Donnie","NickyD316","megan","I.V.","DD34","ky","Jennifer","Henry","Alex Kennedy","brettasaurus","Jacob Neff","Eibon_","Dernager","olivia pincus","James Lafleur","Travis","Clare","chefaustin"],"top_values":[["null",307],["Sam",12],["Jack",10],["sam",10],["jack",8],["emma",8],["Adam",8],["Nathan",8],["alex",8],["Jacob",8],["Dylan",8],["Josh",8],["chloe",7],["Aaron",7],["Matt",7],["Ryan",7],["Alex",7],["Daniel",6],["Kevin",6],["Ethan",6]],"top_words":[["null",308],["matt",47],["sam",45],["alex",43],["chris",39],["david",37],["jack",36],["ben",35],["michael",35],["josh",34],["andrew",33],["\u2728",33],["the",32],["daniel",31],["ryan",31],["james",29],["adam",28],["paul",26],["nick",25],["tyler",25],["luke",24],["ethan",24],["thomas",23],["john",23],["nathan",23]],"vocab_skipped":null,"word_histogram":{"counts":[4866,2867,0,301,0,62,0,20,0,7,0,5,0,3,0,5,0,0,1,0,1,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.5333333333333332,2.0666666666666664,2.6,3.1333333333333333,3.6666666666666665,4.2,4.733333333333333,5.266666666666667,5.8,6.333333333333333,6.866666666666666,7.4,7.933333333333334,8.466666666666667,9.0,9.533333333333333,10.066666666666666,10.6,11.133333333333333,11.666666666666666,12.2,12.733333333333333,13.266666666666666,13.8,14.333333333333334,14.866666666666667,15.4,15.933333333333334,16.46666666666667,17.0]}},"kind":"text","n":8139,"n_null":0,"n_unique":7136,"null_rate":0.0,"stats":{"allcaps_rate":0.019535569480280134,"boilerplate_rate":0.0,"duplicate_rate":0.12323381250767908,"emoji_rate":0.05836097800712618,"len_max":97,"len_mean":9.283327190072491,"len_median":9.0,"len_min":1,"len_p95":16.0,"n_duplicates":1003,"n_empty":0,"one_word_rate":0.5978621452266863,"readability_flesch_mean":45.673900000000025,"url_rate":0.0,"vocab_size":7487,"word_mean":1.478928615309006,"word_median":1.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"41.7% null"},{"code":"high_skew","level":"info","message":"skew=+11.24"}],"column":"num_ratings_pages","extras":{"histogram":{"counts":[2911,1307,355,100,36,15,9,1,3,3,2,2,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,31.175,61.35,91.525,121.7,151.875,182.05,212.225,242.4,272.575,302.75,332.925,363.1,393.27500000000003,423.45,453.625,483.8,513.975,544.15,574.325,604.5,634.6750000000001,664.85,695.025,725.2,755.375,785.5500000000001,815.725,845.9,876.075,906.25,936.4250000000001,966.6,996.775,1026.95,1057.125,1087.3,1117.4750000000001,1147.65,1177.825,1208.0]},"sample":[1.0,40.0,23.0,32.0,26.0,46.0,13.0,72.0,7.0,30.0,13.0,47.0,11.0,10.0,1.0,45.0,44.0,9.0,48.0,17.0,42.0,53.0,34.0,24.0,69.0,24.0,35.0,11.0,13.0,37.0,60.0,29.0,31.0,41.0,14.0,30.0,45.0,26.0,74.0,1.0,24.0,18.0,10.0,60.0,13.0,57.0,19.0,28.0,45.0,21.0,40.0,23.0,7.0,16.0,35.0,29.0,31.0,49.0,25.0,42.0,8.0,92.0,45.0,37.0,18.0,15.0,23.0,12.0,7.0,44.0,48.0,25.0,19.0,17.0,12.0,11.0,33.0,14.0,47.0,86.0,20.0,26.0,18.0,18.0,6.0,31.0,19.0,40.0,18.0,38.0,9.0,30.0,25.0,59.0,192.0,28.0,29.0,26.0,6.0,66.0,5.0,22.0,66.0,1.0,97.0,9.0,54.0,19.0,15.0,7.0,1.0,26.0,132.0,10.0,25.0,67.0,36.0,16.0,11.0,20.0,22.0,33.0,38.0,26.0,14.0,25.0,27.0,21.0,1.0,20.0,9.0,39.0,31.0,161.0,45.0,19.0,25.0,19.0,44.0,28.0,22.0,29.0,5.0,3.0,18.0,15.0,31.0,27.0,27.0,39.0,72.0,43.0,34.0,40.0,45.0,38.0,51.0,26.0,24.0,14.0,16.0,130.0,108.0,79.0,27.0,18.0,33.0,49.0,21.0,15.0,18.0,19.0,15.0,2.0,20.0,50.0,41.0,27.0,37.0,36.0,64.0,13.0,25.0,45.0,19.0,9.0,1.0,22.0,18.0,2.0,12.0,5.0,23.0,41.0,20.0,50.0,30.0,21.0,18.0,16.0,26.0,11.0,39.0,31.0,16.0,13.0,41.0,35.0,40.0,1.0,23.0,16.0,36.0,36.0,5.0,16.0,12.0,14.0,147.0,53.0,62.0,1.0,41.0,10.0,25.0,18.0,24.0,10.0,21.0,18.0,53.0,19.0,36.0,11.0,51.0,46.0,92.0,14.0,34.0,19.0,100.0,33.0,27.0,3.0,30.0,52.0,95.0,23.0,38.0,71.0,7.0,28.0,95.0,10.0,22.0,14.0,28.0,60.0,30.0,21.0,18.0,27.0,23.0,13.0,29.0,26.0,53.0,25.0,25.0,32.0,20.0,21.0,45.0,39.0,22.0,1.0,48.0,27.0,30.0,21.0,18.0,11.0,14.0,32.0,36.0,79.0,31.0,13.0,37.0,11.0,23.0,33.0,21.0,39.0,31.0,24.0,32.0,27.0,85.0,15.0,28.0,16.0,28.0,51.0,20.0,21.0,28.0,58.0,18.0,30.0,12.0,52.0,41.0,43.0,1.0,24.0,39.0,45.0,39.0,1.0,12.0,57.0,24.0,21.0,33.0,53.0,23.0,27.0,25.0,48.0,91.0,10.0,98.0,16.0,22.0,47.0,28.0,44.0,40.0,20.0,50.0,12.0,22.0,22.0,23.0,58.0,18.0,66.0,46.0,29.0,1.0,38.0,45.0,25.0,80.0,52.0,1.0,117.0,6.0,20.0,70.0,15.0,18.0,34.0,15.0,21.0,40.0,18.0,33.0,18.0,1.0,92.0,43.0,43.0,10.0,59.0,37.0,60.0,32.0,39.0,18.0,226.0,5.0,74.0,52.0,22.0,154.0,97.0,33.0,19.0,99.0,26.0,22.0,37.0,26.0,22.0,25.0,9.0,42.0,49.0,19.0,20.0,15.0,48.0,1.0,94.0,46.0,32.0,34.0,29.0,54.0,7.0,37.0,28.0,15.0,91.0,11.0,31.0,9.0,14.0,39.0,15.0,92.0,1.0,52.0,26.0,31.0,27.0,32.0,26.0,57.0,16.0,14.0,41.0,2.0,16.0,17.0,11.0,4.0,10.0,23.0,15.0,17.0,25.0,9.0,98.0,23.0,23.0,11.0,15.0,41.0,61.0,53.0,40.0,22.0,8.0,5.0,1.0,27.0,3.0,16.0,18.0,22.0,35.0,6.0,21.0,7.0,20.0,106.0,20.0,1.0,36.0,22.0,5.0,8.0,15.0,32.0,14.0,24.0,35.0,121.0,23.0,1.0,5.0,9.0,33.0,11.0,7.0,52.0,42.0,59.0,32.0,29.0,32.0,17.0,10.0,20.0,14.0,12.0,10.0]},"kind":"numeric","n":8139,"n_null":3392,"n_unique":177,"null_rate":0.4167588155793095,"stats":{"iqr":27.0,"kurtosis":298.3437560786724,"max":1208.0,"mean":32.814830419212136,"median":25.0,"min":1.0,"n_outliers":236,"outlier_rate":0.04971560985885823,"q1":15.0,"q3":42.0,"skew":11.237209707557714,"std":35.2323640506697,"zero_rate":0.0}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+3.92"},{"code":"outliers","level":"warn","message":"6.2% rows beyond 1.5 IQR"}],"column":"num_reviews","extras":{"histogram":{"counts":[3145,2163,1165,615,396,217,158,98,56,37,22,15,10,11,5,9,4,1,2,1,0,1,2,1,0,0,0,0,1,0,0,1,0,1,1,0,0,0,0,1],"edges":[0.0,429.6,859.2,1288.8000000000002,1718.4,2148.0,2577.6000000000004,3007.2000000000003,3436.8,3866.4,4296.0,4725.6,5155.200000000001,5584.8,6014.400000000001,6444.0,6873.6,7303.200000000001,7732.8,8162.400000000001,8592.0,9021.6,9451.2,9880.800000000001,10310.400000000001,10740.0,11169.6,11599.2,12028.800000000001,12458.400000000001,12888.0,13317.6,13747.2,14176.800000000001,14606.400000000001,15036.0,15465.6,15895.2,16324.800000000001,16754.4,17184.0]},"sample":[461.0,3211.0,3477.0,1881.0,1877.0,1095.0,350.0,672.0,391.0,4801.0,817.0,244.0,838.0,2075.0,189.0,3094.0,339.0,1351.0,1553.0,346.0,244.0,65.0,1533.0,723.0,989.0,224.0,765.0,1451.0,667.0,896.0,59.0,281.0,2150.0,2033.0,338.0,884.0,1653.0,385.0,418.0,3275.0,961.0,686.0,192.0,234.0,460.0,997.0,667.0,2196.0,97.0,979.0,441.0,819.0,507.0,902.0,517.0,1069.0,347.0,6738.0,701.0,1239.0,26.0,1188.0,640.0,585.0,16.0,387.0,159.0,1153.0,3002.0,592.0,1089.0,1019.0,258.0,181.0,1762.0,765.0,1070.0,430.0,808.0,1145.0,769.0,369.0,656.0,1181.0,591.0,678.0,145.0,1002.0,155.0,358.0,416.0,758.0,727.0,694.0,4094.0,331.0,2106.0,1285.0,591.0,971.0,471.0,532.0,299.0,2240.0,426.0,1296.0,1285.0,1178.0,2347.0,1544.0,1005.0,624.0,493.0,332.0,502.0,187.0,693.0,1197.0,638.0,741.0,380.0,209.0,1123.0,800.0,1436.0,1149.0,260.0,396.0,5233.0,805.0,307.0,456.0,775.0,1804.0,261.0,593.0,523.0,465.0,484.0,292.0,1265.0,544.0,1035.0,472.0,108.0,695.0,229.0,321.0,1409.0,2307.0,737.0,635.0,620.0,1189.0,17.0,150.0,840.0,1531.0,1379.0,378.0,605.0,1360.0,1221.0,397.0,56.0,426.0,25.0,383.0,686.0,973.0,357.0,670.0,368.0,21.0,357.0,1745.0,6498.0,386.0,577.0,2714.0,1426.0,4604.0,436.0,1003.0,1246.0,674.0,379.0,678.0,1401.0,2466.0,2495.0,2516.0,1509.0,3817.0,1547.0,2.0,373.0,975.0,808.0,810.0,398.0,542.0,1822.0,1263.0,356.0,1466.0,371.0,196.0,2364.0,24.0,662.0,321.0,311.0,388.0,1431.0,1190.0,627.0,1636.0,3247.0,6328.0,1119.0,141.0,552.0,557.0,663.0,840.0,1397.0,1283.0,1672.0,305.0,2074.0,1470.0,281.0,1599.0,989.0,3582.0,2283.0,585.0,3297.0,1270.0,464.0,341.0,422.0,1361.0,886.0,2972.0,558.0,310.0,203.0,211.0,1719.0,668.0,822.0,214.0,200.0,1308.0,359.0,463.0,1327.0,357.0,503.0,171.0,408.0,855.0,160.0,444.0,2905.0,285.0,733.0,1037.0,1577.0,189.0,518.0,744.0,696.0,281.0,520.0,716.0,2015.0,244.0,1322.0,635.0,677.0,688.0,374.0,0.0,166.0,694.0,569.0,803.0,72.0,136.0,270.0,538.0,92.0,332.0,1554.0,280.0,987.0,1076.0,649.0,177.0,55.0,10.0,609.0,766.0,1202.0,116.0,3079.0,221.0,954.0,29.0,349.0,739.0,258.0,657.0,665.0,455.0,1765.0,657.0,264.0,1139.0,87.0,410.0,388.0,785.0,56.0,396.0,169.0,281.0,366.0,283.0,255.0,490.0,844.0,194.0,150.0,1388.0,848.0,705.0,52.0,653.0,1124.0,695.0,988.0,373.0,78.0,92.0,131.0,30.0,2223.0,127.0,243.0,1374.0,51.0,596.0,367.0,196.0,24.0,647.0,643.0,88.0,154.0,637.0,1871.0,1171.0,345.0,899.0,967.0,2619.0,1235.0,978.0,621.0,70.0,62.0,146.0,540.0,667.0,1876.0,430.0,1412.0,754.0,590.0,319.0,343.0,1062.0,509.0,404.0,297.0,595.0,562.0,207.0,309.0,789.0,299.0,315.0,961.0,182.0,15.0,425.0,21.0,472.0,336.0,547.0,110.0,3017.0,665.0,181.0,1154.0,513.0,0.0,540.0,89.0,727.0,547.0,121.0,101.0,0.0,62.0,351.0,113.0,1270.0,972.0,55.0,379.0,141.0,447.0,1955.0,193.0,377.0,271.0,180.0,1372.0,186.0,0.0,9.0,577.0,1390.0,67.0,699.0,520.0,95.0,344.0,513.0,103.0,78.0,562.0,685.0,704.0,270.0,49.0,548.0,992.0,500.0,192.0,53.0,671.0,320.0,348.0,43.0,832.0,59.0,272.0,546.0,26.0,141.0,760.0,99.0,19.0,765.0,394.0,568.0,10.0,396.0,402.0,18.0,13.0,315.0,38.0,214.0,465.0,573.0,262.0,1024.0,88.0,446.0,819.0,102.0,1.0,129.0,295.0,554.0,166.0,230.0,322.0,1310.0,595.0,200.0,1701.0,988.0]},"kind":"numeric","n":8139,"n_null":0,"n_unique":2416,"null_rate":0.0,"stats":{"iqr":863.0,"kurtosis":33.30564744361335,"max":17184.0,"mean":868.3644182331982,"median":588.0,"min":0.0,"n_outliers":505,"outlier_rate":0.062046934512839415,"q1":267.0,"q3":1130.0,"skew":3.92255544165068,"std":979.1468568887229,"zero_rate":0.009583486914854404}},{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"}],"column":"username","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[9,0,0,42,0,0,168,0,0,343,0,0,570,0,0,778,0,0,941,0,0,937,0,0,996,0,0,932,0,0,805,0,0,654,0,0,483,0,0,481],"edges":[2.0,2.325,2.65,2.975,3.3,3.625,3.95,4.275,4.6,4.925000000000001,5.25,5.575,5.9,6.2250000000000005,6.55,6.875,7.2,7.525,7.8500000000000005,8.175,8.5,8.825,9.15,9.475000000000001,9.8,10.125,10.450000000000001,10.775,11.1,11.425,11.75,12.075000000000001,12.4,12.725,13.05,13.375,13.700000000000001,14.025,14.35,14.675,15.0]},"near_unique":true,"sample":["iaiaiand","joshuapeinado","hilanna","dcabatin","markella","thanosvav","josh2410","paintmytrust","ciarrariley","psychotic","ferras96","steevee","jupiterkansas","fuchsiadyke","steven_clarke","ryan_oliver","chris_ofdeath","skrana","hsblechman","isajjar","driveridrive","ktc","gillyk82","ettinauer","mentallytwelve","davidraider88","iznogoud","rcjohnso","forrestc","omaralicetin","firas18","jackknightley","dontjo","nickyd","sharktale","vishnevetsky","dd34","dqnielplainvewz","jenniferv","henryg9876","alexkennedy","brettasaurus","jakeneff","eibon_","dernager","olivialow","rusty_james","travis_kyker","clarefranceso","chefaustin"],"top_values":[],"top_words":[["deathproof",1],["superpulse",1],["lilfilm",1],["ianamurray",1],["punchdrunklizzy",1],["elihayes",1],["colonelmortimer",1],["allisoncm",1],["juggernaut323",1],["iaiaiand",1],["kaylafavia",1],["sonofjorel",1],["siegel",1],["dirkh",1],["nycsubwayrat",1],["filipe_furtado",1],["sopheyquinn",1],["bluevelvets",1],["jakepcole",1],["riverjphoenix",1],["truman",1],["davidehrlich",1],["kurstboy",1],["jay",1],["holliehorror",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,8139,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":8139,"n_null":0,"n_unique":8139,"null_rate":0.0,"stats":{"allcaps_rate":0.00036859565057132326,"boilerplate_rate":0.0,"duplicate_rate":0.0,"emoji_rate":0.0,"len_max":15,"len_mean":9.793463570463201,"len_median":10.0,"len_min":2,"len_p95":15.0,"n_duplicates":0,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":2.780000000000034,"url_rate":0.0,"vocab_size":8139,"word_mean":1.0,"word_median":1.0}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","num_reviews.stats","num_ratings_pages.stats","num_ratings_pages.null_rate","display_name.stats","display_name.top_values","username.n_unique","_id.n_unique"],"featured_charts":[{"caption":"Look at the long right tail \u2014 most users sit well below the 868 mean while a few hit thousands of reviews.","column":"num_reviews","kind":"histogram"},{"caption":"Same skew pattern as reviews, but note that 41.7% of values are missing before reading the distribution.","column":"num_ratings_pages","kind":"histogram"},{"caption":"Top display names show common first names like Sam and Jack, plus 307 literal 'null' entries flagging data quality issues.","column":"display_name","kind":"bar"},{"caption":"Most display names are short (median 9 chars) but the max stretches to 97 \u2014 check for outlier-style names.","column":"display_name","kind":"length"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset contains 8,139 Letterboxd user profiles with 5 columns covering identifiers (username, _id), a display name, and two activity metrics (num_reviews, num_ratings_pages). The activity metrics are the most interesting signal: num_reviews is heavily right-skewed with a mean of 868 but a median of 588 and a max of 17,184, and num_ratings_pages shows similar skew along with a 41.7% null rate that warrants investigation. Display names are also worth a look \u2014 about 60% are one-word, 12.3% are duplicates, and 'null' literally appears 307 times as a value, suggesting some data quality issues. The username and _id columns are fully unique identifiers and can largely be ignored for analytical purposes.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.len_min","stats.len_max","stats.len_mean","stats.one_word_rate","stats.duplicate_rate","stats.vocab_size","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column is a per-row identifier, almost certainly MongoDB ObjectIds: every one of the 8139 values is unique, exactly 24 characters long, single-token, and the samples are 24-char hex strings. There are no nulls, duplicates, or empties, and vocab_size equals n, confirming a pure primary key with no analytic content.","role":"identifier","scope":"column","target":"_id","treatment":"Drop for modelling; retain only as a join key."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.one_word_rate","stats.len_median","stats.word_median","stats.duplicate_rate","stats.n_duplicates","stats.emoji_rate","stats.vocab_size","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"Short user display names: nearly 60% are a single word (one_word_rate 0.5978), median length 9 chars and median word count 1, with the top values dominated by first names like Sam, Jack, Emma. Notable quirks: 307 rows literally contain the string \"null\" (not actual nulls, since null_rate is 0.0), duplicate_rate is 12.3% with 1003 repeats, and 5.8% include emoji. Vocabulary is wide (7487 tokens across 8139 rows), consistent with free-form handles rather than a controlled label set.","role":"free_text","scope":"column","target":"display_name","treatment":"Treat as free-text handles: replace literal \"null\" tokens with true missing, lowercase-normalize, and avoid using as a join key given 12% duplicates."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.min","stats.max","stats.median","stats.mean","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric count of rating pages per item, present for roughly 58% of rows (null_rate 0.4168) with 177 distinct values from 1 to 1208 and a median of 25. The distribution is severely right-skewed (skew 11.24, kurtosis 298.34) with 236 outliers above the IQR fence, so the mean of 32.81 sits well above the typical row.","role":"feature","scope":"column","target":"num_ratings_pages","treatment":"log-transform and impute missing before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.kurtosis","stats.q1","stats.q3","stats.n_outliers","stats.outlier_rate","stats.zero_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"num_reviews is a count of reviews per item, ranging from 0 to 17184 with a median of 588 and mean of 868. The distribution is heavily right-skewed (skew 3.92, kurtosis 33.3), with 505 outliers (6.2%) and only 0.96% zeros. The gap between q3 (1130) and max (17184) signals a long tail of highly-reviewed items.","role":"feature","scope":"column","target":"num_reviews","treatment":"log1p-transform before modelling to tame the right tail."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.one_word_rate","stats.duplicate_rate","stats.len_min","stats.len_mean","stats.len_max","stats.allcaps_rate","stats.url_rate","stats.emoji_rate","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds unique single-token usernames: every one of the 8139 rows has a distinct value (n_unique=8139, duplicate_rate=0.0) and one_word_rate is 1.0. Lengths are short and tightly bounded (len_min=2, len_mean\u22489.79, len_max=15), consistent with a handle field rather than free text. No nulls, no URLs, no emoji, and allcaps usage is negligible (0.00037).","role":"identifier","scope":"column","target":"username","treatment":"Treat as a user identifier; drop from modelling features and use only for joins or deduplication."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":2071,"prompt_tokens":7667,"total_tokens":9738}},"language_counts":{},"meta":{"generated_at":"2026-05-01T17:51:53+00:00","mode":"full","row_count":8139,"sampled_rows":8139,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/entertainment/movies/letterboxd/users_export.csv"},"notes":[],"saturn_version":"0.2.0","schema":{"_id":"text","display_name":"text","num_ratings_pages":"numeric","num_reviews":"numeric","username":"text"}}
