{"columns":[{"alerts":[],"column":"summons_number","extras":{"histogram":{"counts":[9,1504,0,0,1945,0,0,0,0,0,0,0,0,0,0,0,0,0,4416,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,174,1947],"edges":[1124851148.0,1328112264.55,1531373381.1,1734634497.65,1937895614.2,2141156730.75,2344417847.3,2547678963.8500004,2750940080.4,2954201196.95,3157462313.5,3360723430.05,3563984546.6000004,3767245663.15,3970506779.7000003,4173767896.25,4377029012.8,4580290129.35,4783551245.9,4986812362.450001,5190073479.0,5393334595.55,5596595712.1,5799856828.650001,6003117945.200001,6206379061.75,6409640178.3,6612901294.85,6816162411.400001,7019423527.950001,7222684644.5,7425945761.05,7629206877.6,7832467994.150001,8035729110.700001,8238990227.25,8442251343.8,8645512460.35,8848773576.900002,9052034693.45,9255295810.0]},"sample":[1494159016.0,1494551524.0,1494274954.0,1493610430.0,1500442197.0,1491832897.0,1493445443.0,1495714410.0,1502101737.0,1496151100.0,1492939080.0,1495716314.0,1499817484.0,1500810149.0,1494687884.0,1502060863.0,1496492729.0,1497757710.0,1501981675.0,1492438765.0,1502051515.0,1500386340.0,1500386352.0,1493897329.0,1499697491.0,1502765767.0,1499177938.0,1492084580.0,1502338830.0,1495694288.0,1502009640.0,1501798730.0,1494172318.0,1498296660.0,1502552942.0,1490548518.0,1501449540.0,1501547951.0,1486099087.0,1500715712.0,1497846572.0,1502150244.0,1501603863.0,1492007134.0,1501592385.0,1500966575.0,1496092776.0,1496780085.0,1499690496.0,1481069202.0,1490924565.0,1497713523.0,1501207052.0,1489486379.0,1496807935.0,1500797420.0,1493628288.0,1499269134.0,1501002030.0,1491530923.0,1499644231.0,1498977066.0,1474722507.0,1498405927.0,1495100583.0,1496310871.0,1499203950.0,1499269444.0,1496003317.0,1499805524.0,1500534894.0,1492200785.0,1488102193.0,1497856711.0,1498576643.0,1496450784.0,1492108972.0,2028596016.0,2028582121.0,2028548599.0,2028548447.0,2028548435.0,2028548095.0,2028548058.0,2028544790.0,2028544466.0,2028542597.0,2028530248.0,2028530145.0,2028520796.0,2028516549.0,2028516434.0,2028482801.0,2028480014.0,2028476722.0,2028472856.0,2028408261.0,2028413270.0,2028452717.0,2028452754.0,2028462085.0,2028472492.0,2028472650.0,2028281080.0,2028333248.0,2028376958.0,2028377021.0,2028396751.0,2028191030.0,2028192641.0,2028194972.0,2028212779.0,2028221409.0,2028221501.0,2028240854.0,2028243995.0,2028249456.0,2028036930.0,2028055315.0,2028069193.0,2028111215.0,2028136030.0,2028138798.0,2028159534.0,2028177160.0,2028177214.0,2026835020.0,2026835056.0,2027282105.0,2027617942.0,2027686990.0,2027698980.0,2027699016.0,2027743583.0,2027759165.0,2027867247.0,2027888779.0,2027911388.0,2027914924.0,1462139565.0,2014653847.0,2019699760.0,2019699837.0,2022996987.0,2022997013.0,2024491870.0,2024564720.0,2025345331.0,2025469676.0,2025469792.0,2026133852.0,2026455727.0,2026757999.0,2027891420.0,2027891535.0,2027891547.0,2027899765.0,2027981159.0,2028025396.0,2028055182.0,2028423250.0,2028688040.0,2001668065.0,2024307541.0,2026581782.0,2027164108.0,2027222078.0,2027236375.0,2027412130.0,2027420149.0,9255295639.0,9254936236.0,9254936224.0,9254935992.0,9254935852.0,9254930465.0,9254930350.0,9254445186.0,9254445320.0,9254507398.0,9254507416.0,9254775332.0,9254930131.0,9254930258.0,9254034058.0,9254186909.0,9254275098.0,9254275190.0,9254341060.0,9254341083.0,9253577290.0,9253622325.0,9253622350.0,9253672444.0,9253688208.0,9253688294.0,9253735594.0,9252483615.0,9252903665.0,9252903689.0,9252903800.0,9252903859.0,9252917056.0,9252917070.0,9253112300.0,9253112347.0,9253248373.0,9253353569.0,9253390311.0,9253390372.0,9253500888.0,9253500920.0,9253501017.0,9253501029.0,9253501080.0,9253501133.0,9253525680.0,9253525897.0,9253525903.0,9251772563.0,9251803470.0,9251803559.0,9251803754.0,9251859310.0,9251885813.0,9252005626.0,9252110240.0,9252110318.0,9252110331.0,9252335377.0,9252442765.0,9250492765.0,9250492868.0,9250492881.0,9250529867.0,9250574034.0,9250807533.0,9250807570.0,9250807600.0,9250949133.0,9251046852.0,9251046864.0,9251046888.0,9248309460.0,9248323686.0,9248404339.0,9248539464.0,9248539490.0,9248539658.0,9248629600.0,9249520694.0,9249804088.0,9249804167.0,9249984601.0,9250210541.0,9243513151.0,9245359268.0,9246472860.0,9247592641.0,9248103261.0,9248103406.0,9248177785.0,9248309392.0,9136829663.0,9166121528.0,9166121590.0,9173259056.0,9213047332.0,9213047435.0,9218793421.0,9231168320.0,9239219158.0,9239219195.0,9241369589.0,9241841965.0,4976290967.0,4976291030.0,4976291080.0,4976291170.0,4976291443.0,8904161137.0,8904161186.0,8971746828.0,8971747201.0,8971747237.0,4976288936.0,4976289096.0,4976289540.0,4976289862.0,4976289928.0,4976290281.0,4976286563.0,4976287014.0,4976287166.0,4976287178.0,4976287580.0,4976288018.0,4976288020.0,4976288110.0,4976288122.0,4976288298.0,4976284359.0,4976284360.0,4976284396.0,4976284475.0,4976284542.0,4976284608.0,4976285479.0,4976285741.0,4976286241.0,4976281966.0,4976282107.0,4976282156.0,4976282703.0,4976282740.0,4976282995.0,4976283010.0,4976283148.0,4976283276.0,4976283410.0,4976283550.0,4976283562.0,4976284128.0,4976284141.0,4976280275.0,4976280433.0,4976280585.0,4976280664.0,4976280858.0,4976280895.0,4976281050.0,4976281140.0,4976281188.0,4976281231.0,4976281784.0,4976278153.0,4976278220.0,4976278440.0,4976278463.0,4976278797.0,4976278920.0,4976279297.0,4976279480.0,4976279911.0,4976275954.0,4976276193.0,4976276478.0,4976276582.0,4976276636.0,4976276764.0,4976277628.0,4976277641.0,4976277800.0,4976277823.0,4976277963.0,4976273726.0,4976273829.0,4976274184.0,4976274469.0,4976274548.0,4976274706.0,4976274883.0,4976275528.0,4976275670.0,4976275747.0,4976275759.0,4976275784.0,4976271456.0,4976271500.0,4976271523.0,4976271547.0,4976271870.0,4976272023.0,4976272138.0,4976272291.0,4976272321.0,4976272497.0,4976272655.0,4976272734.0,4976272977.0,4976273179.0,4976273283.0,4976273301.0,4976273416.0,4976269279.0,4976269401.0,4976269449.0,4976269681.0,4976269784.0,4976269838.0,4976269887.0,4976269966.0,4976270221.0,4976270440.0,4976270543.0,4976270701.0,4976267635.0,4976267740.0,4976268007.0,4976268032.0,4976268287.0,4976268421.0,4976268639.0,4976268846.0,4976268901.0,4976265250.0,4976265262.0,4976265286.0,4976265389.0,4976265407.0,4976265663.0,4976266199.0,4976266448.0,4976267052.0,4976267064.0,4976267301.0,4976262881.0,4976263022.0,4976263149.0,4976263150.0,4976263423.0,4976263630.0,4976264099.0,4976264208.0,4976264221.0,4976264749.0,4976260902.0,4976261062.0,4976261670.0,4976262200.0,4976262571.0,4976258506.0,4976258592.0,4976258660.0,4976259134.0,4976259481.0,4976259699.0,4976259808.0,4976259810.0,4976259869.0,4976260082.0,4976260112.0,4976260161.0,4976260227.0,4976260549.0,4976256662.0,4976257502.0,4976257617.0,4976257848.0,4976258336.0,4976255396.0,4976255633.0,4976255657.0,4976255797.0,4976255803.0,4976256157.0,4976256194.0,4976252309.0,4976252358.0,4976252383.0,4976252528.0,4976252747.0,4976252760.0,4976252954.0,4976253028.0,4976253120.0,4976253387.0,4976253405.0,4976253480.0,4976253806.0,4976254460.0,4976254471.0,4976250349.0,4976250817.0,4976250830.0,4976251020.0,4976251081.0,4976251408.0,4976251512.0,4976251524.0,4976251573.0,4976251846.0,4976251925.0,4976252012.0,4976252097.0,4976247363.0,4976248306.0,4976248460.0,4976248616.0,4976248641.0,4976249300.0,4976249372.0,4976249487.0,4976249591.0,4976249657.0,4976249724.0,4976245081.0,4976245172.0,4976245366.0,4976245561.0]},"kind":"numeric","n":10000,"n_null":0,"n_unique":10000,"null_rate":0.0,"stats":{"iqr":2948110270.25,"kurtosis":-0.9134755351123687,"max":9255295810.0,"mean":4778744249.9537,"median":4976262516.0,"min":1124851148.0,"n_outliers":0,"outlier_rate":0.0,"q1":2028177479.0,"q3":4976287749.25,"skew":0.46808442893097224,"std":2705973234.5077815,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"368 singleton categories"}],"column":"issue_date","extras":{"singletons":368,"top_values":[["2025-12-28T00:00:00.000",6542],["2025-12-30T00:00:00.000",1594],["2025-12-29T00:00:00.000",356],["2026-06-26T00:00:00.000",14],["2026-09-27T00:00:00.000",13],["2026-09-25T00:00:00.000",12],["2025-12-31T00:00:00.000",12],["2026-06-27T00:00:00.000",11],["2026-10-25T00:00:00.000",10],["2026-08-31T00:00:00.000",10],["2026-08-27T00:00:00.000",10],["2026-07-26T00:00:00.000",10],["2026-06-30T00:00:00.000",10],["2026-08-25T00:00:00.000",9],["2026-10-29T00:00:00.000",8],["2026-10-17T00:00:00.000",8],["2026-10-05T00:00:00.000",8],["2026-09-23T00:00:00.000",8],["2026-07-27T00:00:00.000",8],["2026-07-24T00:00:00.000",8]]},"kind":"categorical","n":10000,"n_null":0,"n_unique":687,"null_rate":0.0,"stats":{"cardinality":687,"entropy":2.764998092524379,"entropy_ratio":0.2933944507966807,"top_rate":0.6542,"top_value":"2025-12-28T00:00:00.000"}},{"alerts":[{"code":"outliers","level":"warn","message":"10.1% rows beyond 1.5 IQR"}],"column":"violation_code","extras":{"histogram":{"counts":[9,0,48,38,858,216,412,1483,14,6,0,3,4,4426,4,880,0,376,27,162,24,3,0,4,28,7,185,105,117,121,14,76,57,14,21,0,0,2,2,254],"edges":[4.0,6.375,8.75,11.125,13.5,15.875,18.25,20.625,23.0,25.375,27.75,30.125,32.5,34.875,37.25,39.625,42.0,44.375,46.75,49.125,51.5,53.875,56.25,58.625,61.0,63.375,65.75,68.125,70.5,72.875,75.25,77.625,80.0,82.375,84.75,87.125,89.5,91.875,94.25,96.625,99.0]},"sample":[78.0,98.0,37.0,40.0,14.0,19.0,14.0,40.0,40.0,17.0,20.0,40.0,14.0,14.0,14.0,98.0,40.0,68.0,46.0,19.0,40.0,98.0,40.0,46.0,14.0,21.0,40.0,98.0,40.0,74.0,40.0,14.0,46.0,40.0,67.0,51.0,14.0,17.0,67.0,14.0,46.0,46.0,45.0,98.0,46.0,14.0,67.0,20.0,20.0,16.0,14.0,40.0,40.0,14.0,51.0,46.0,98.0,14.0,67.0,40.0,46.0,98.0,51.0,17.0,40.0,17.0,46.0,46.0,40.0,21.0,74.0,19.0,40.0,72.0,40.0,14.0,98.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,14.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,21.0,40.0,21.0,21.0,66.0,66.0,14.0,21.0,21.0,21.0,21.0,14.0,20.0,21.0,21.0,21.0,66.0,66.0,21.0,66.0,14.0,21.0,21.0,21.0,21.0,21.0,80.0,66.0,80.0,40.0,85.0,98.0,66.0,21.0,78.0,85.0,66.0,14.0,40.0,78.0,40.0,40.0,66.0,74.0,98.0,14.0,40.0,40.0,14.0,14.0,20.0,20.0,4.0,19.0,14.0,40.0,14.0,46.0,22.0,14.0,14.0,71.0,14.0,40.0,50.0,40.0,14.0,19.0,14.0,40.0,40.0,16.0,16.0,16.0,16.0,40.0,14.0,20.0,17.0,74.0,70.0,40.0,14.0,20.0,20.0,40.0,40.0,40.0,40.0,17.0,17.0,40.0,40.0,40.0,40.0,40.0,16.0,18.0,61.0,46.0,19.0,46.0,14.0,20.0,46.0,46.0,70.0,10.0,33.0,70.0,70.0,17.0,40.0,40.0,56.0,40.0,74.0,14.0,14.0,14.0,14.0,14.0,70.0,76.0,14.0,70.0,19.0,14.0,14.0,14.0,64.0,70.0,74.0,71.0,11.0,22.0,71.0,14.0,19.0,14.0,31.0,16.0,19.0,18.0,46.0,46.0,17.0,16.0,36.0,36.0,36.0,36.0,36.0,40.0,13.0,14.0,14.0,20.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0,36.0]},"kind":"numeric","n":10000,"n_null":0,"n_unique":62,"null_rate":0.0,"stats":{"iqr":15.0,"kurtosis":2.9859603501699548,"max":99.0,"mean":35.8522,"median":36.0,"min":4.0,"n_outliers":1007,"outlier_rate":0.1007,"q1":21.0,"q3":36.0,"skew":1.5141769129369393,"std":17.549180964798712,"zero_rate":0.0}},{"alerts":[],"column":"violation_description","extras":{"singletons":10,"top_values":[["PHTO SCHOOL ZN SPEED VIOLATION",4416],["No Parking Street Cleaning",1428],["14-No Standing",598],["40-Fire Hydrant",463],["20A-No Parking (Non-COM)",131],["19-No Stand (bus stop)",123],["16A-No Std (Com Veh) Non-COM",117],["46A-Double Parking (Non-COM)",106],["Detached Trailer",105],["Fire Hydrant",94],["71A-Insp Sticker Expired (NYS)",77],["70A-Reg. Sticker Expired (NYS)",66],["No Standing",61],["Missing Equipment",56],["50-Crosswalk",53],["74-Missing Display Plate",39],["13-No Stand (taxi stand)",38],["17-No Stand (exc auth veh)",38],["Double Parking",32],["98-Obstructing Driveway",31]]},"kind":"categorical","n":10000,"n_null":1513,"n_unique":74,"null_rate":0.1513,"stats":{"cardinality":74,"entropy":2.807939732895211,"entropy_ratio":0.4522040133899608,"top_rate":0.5203252032520326,"top_value":"PHTO SCHOOL ZN SPEED VIOLATION"}},{"alerts":[{"code":"multilingual","level":"info","message":"28 languages detected in sample"},{"code":"allcaps","level":"info","message":"77.3% rows are all-caps"},{"code":"duplicates","level":"warn","message":"68.8% duplicate strings"}],"column":"street_name","extras":{"language_counts":{"__engine":"fasttext:4,612","ar":14,"ca":14,"cs":10,"da":1,"de":56,"en":3596,"es":86,"eu":5,"fr":39,"gl":1,"id":4,"it":21,"ja":614,"ko":14,"lt":1,"mk":1,"ms":1,"nl":25,"no":9,"pl":3,"pt":15,"ro":1,"ru":12,"sv":1,"te":1,"uk":8,"zh":59},"language_sample_size":5000,"length_histogram":{"counts":[1,0,9,0,15,0,150,0,105,0,0,533,0,727,0,1009,0,396,0,0,415,0,374,0,489,0,404,0,344,0,0,155,0,90,0,111,0,1013,0,3656],"edges":[2.0,2.45,2.9,3.35,3.8,4.25,4.7,5.15,5.6,6.05,6.5,6.95,7.4,7.8500000000000005,8.3,8.75,9.2,9.65,10.1,10.55,11.0,11.450000000000001,11.9,12.35,12.8,13.25,13.700000000000001,14.15,14.6,15.05,15.5,15.950000000000001,16.4,16.85,17.3,17.75,18.2,18.650000000000002,19.1,19.55,20.0]},"near_unique":false,"sample":["BEACH 145 ST","WB HYLAN BLVD @ LUTE","NB KNAPP ST @ ALLEN","EB NORTHERN BLVD @ A","E 45th St","EB FOREST AVE @ CRYS","10th Ave","SB WATERS PL @ BRONX","WB SEAGIRT BLVD @ B","S/W C/O 173 ST","SB WINCHESTER BLVD @","Queens Blvd","RECTOR PLACE","PENELOPE AVE","DEAN STREET","MOTT AVENUE","SHORE FRONT PKY","EB FOUR CORNERS RD @","WB GOETHALS RD N @ J","E 60th St","79 STREET","FOWLER AVE","PROSPECT PLACE","MARION AVE","NB LITTLE NECK PKWY","WB SHORE PKWY @ KNAP","9th Ave","ATLANTIC AVENUE","VERMONT AVE","WB SHORE PKWY @ BROW","EB CROSS BRONX EXPWY","SB BRUCKNER BLVD @ W","WB UNION TRPK @ 213T","Gulf Ave","Sea Breeze Ave","43rd Ave","WB NORTHERN BLVD @ 8","E 223rd St","Lexington Ave","Broad St","NB BAILEY AVE @ W 19","WB QUEENS BLVD @ IRE","EAST 19 STREET","NB OCEAN PKWY @ ELMW","EB E TREMONT AVE @ C","NB WOODHAVEN BLVD @","WEST 137 STREET","Nicholas Ave","65 STREET","SB MAIN ST @ 82ND DR"],"top_values":[["SB CROSS BAY BLVD @",115],["WB N CONDUIT AVE @ 8",76],["BROADWAY",49],["WB ASTORIA BLVD N @",47],["NB WOODHAVEN BLVD @",47],["NB SPRINGFIELD BLVD",46],["EB CROSS BRONX EXPWY",44],["WB N CONDUIT AVE @ 1",44],["NB FRANCIS LEWIS BLV",44],["NB SOUTHERN BLVD @ C",43],["SB HAMILTON AVE @ BU",43],["EB BRUCKNER BLVD @ W",42],["NB CROSS BAY BLVD @",41],["6th Ave",39],["EB NORTHERN BLVD @ A",39],["EB SHORE PKWY @ OCEA",39],["SB FRANCIS LEWIS BLV",38],["W 42nd St",34],["EB S CONDUIT AVE @ M",34],["EASTERN PARKWAY",33]],"top_words":[["@",3809],["ave",2506],["st",2287],["blvd",1255],["sb",1180],["wb",1137],["nb",1118],["street",1002],["eb",982],["avenue",760],["w",749],["e",720],["pkwy",409],["rd",364],["west",320],["s",283],["conduit",283],["n",256],["bay",229],["cross",227],["park",180],["ocean",173],["pl",168],["queens",160],["east",143]],"vocab_skipped":null,"word_histogram":{"counts":[137,0,0,0,0,3855,0,0,0,0,1547,0,0,0,0,810,0,0,0,0,2564,0,0,0,0,1014,0,0,0,69],"edges":[1.0,1.2,1.4,1.6,1.8,2.0,2.2,2.4000000000000004,2.6,2.8,3.0,3.2,3.4000000000000004,3.6,3.8000000000000003,4.0,4.2,4.4,4.6,4.800000000000001,5.0,5.2,5.4,5.6000000000000005,5.800000000000001,6.0,6.2,6.4,6.6000000000000005,6.800000000000001,7.0]}},"kind":"text","n":10000,"n_null":4,"n_unique":3115,"null_rate":0.0004,"stats":{"allcaps_rate":0.7732092837134854,"boilerplate_rate":0.0,"duplicate_rate":0.688375350140056,"emoji_rate":0.0,"len_max":20,"len_mean":14.871748699479792,"len_median":16.0,"len_min":2,"len_p95":20.0,"n_duplicates":6881,"n_empty":0,"one_word_rate":0.013705482192877151,"readability_flesch_mean":62.54637500000002,"url_rate":0.0,"vocab_size":1760,"word_mean":3.512905162064826,"word_median":3.0}},{"alerts":[],"column":"vehicle_make","extras":{"singletons":45,"top_values":[["HONDA",1331],["TOYOT",1302],["NISSA",770],["FORD",603],["BMW",559],["ME/BE",521],["JEEP",450],["CHEVR",449],["HYUND",365],["SUBAR",273],["KIA",268],["LEXUS",268],["MAZDA",257],["AUDI",242],["ACURA",221],["VOLKS",199],["DODGE",175],["TESLA",152],["INFIN",151],["GMC",134]]},"kind":"categorical","n":10000,"n_null":78,"n_unique":126,"null_rate":0.0078,"stats":{"cardinality":126,"entropy":4.660590063008295,"entropy_ratio":0.6679666165193021,"top_rate":0.13414634146341464,"top_value":"HONDA"}},{"alerts":[],"column":"vehicle_color","extras":{"singletons":36,"top_values":[["GY",2079],["BK",1784],["WH",1579],["BL",631],["RD",348],["WHITE",347],["BLK",275],["BLACK",273],["GREY",239],["GRY",167],["GR",148],["BLUE",131],["RED",124],["GRAY",113],["SILVE",99],["WHT",65],["YW",62],["BR",60],["WHI",57],["BLU",46]]},"kind":"categorical","n":10000,"n_null":943,"n_unique":99,"null_rate":0.0943,"stats":{"cardinality":99,"entropy":3.675742078300628,"entropy_ratio":0.5544643754971937,"top_rate":0.2295462073534283,"top_value":"GY"}},{"alerts":[{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"allcaps","level":"info","message":"100.0% rows are all-caps"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"85.7% duplicate strings"}],"column":"violation_time","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9996,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[4.5,4.525,4.55,4.575,4.6,4.625,4.65,4.675,4.7,4.725,4.75,4.775,4.8,4.825,4.85,4.875,4.9,4.925,4.95,4.975,5.0,5.025,5.05,5.075,5.1,5.125,5.15,5.175,5.2,5.225,5.25,5.275,5.3,5.325,5.35,5.375,5.4,5.425,5.45,5.475,5.5]},"near_unique":false,"sample":["0840P","0259P","1127A","1135A","0622P","0725A","0453P","0939A","1139A","1230P","0826P","1249P","0928A","0245A","0852A","0743A","1232P","1034A","0334A","0131P","0947A","1124P","1148A","0235A","0421P","0156P","0107A","0102A","0230A","0728A","0808P","0556P","0556P","0821A","0849A","0717A","0812A","1238P","0309P","0139P","1232P","0921A","0958A","0919A","0446A","0117A","0120A","1158A","0915A","1040A"],"top_values":[["0839A",29],["0911A",23],["0915A",22],["0845A",22],["1200P",22],["1138A",22],["1151A",22],["0956A",22],["1203P",22],["0248P",21],["0847A",21],["0936A",21],["0941A",21],["1029A",21],["1136A",21],["1142A",21],["0317P",21],["0935A",20],["1001A",20],["1130A",20]],"top_words":[["0839a",29],["0911a",23],["0915a",22],["0845a",22],["1200p",22],["1138a",22],["1151a",22],["0956a",22],["1203p",22],["0248p",21],["0847a",21],["0936a",21],["0941a",21],["1029a",21],["1136a",21],["1142a",21],["0317p",21],["0935a",20],["1001a",20],["1130a",20],["0955a",20],["1015a",20],["1149a",20],["1013a",20],["1147a",20]],"vocab_skipped":null,"word_histogram":{"counts":[9995,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.0333333333333334,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666667,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333333,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5,1.5333333333333332,1.5666666666666667,1.6,1.6333333333333333,1.6666666666666665,1.7,1.7333333333333334,1.7666666666666666,1.8,1.8333333333333335,1.8666666666666667,1.9,1.9333333333333333,1.9666666666666668,2.0]}},"kind":"text","n":10000,"n_null":4,"n_unique":1432,"null_rate":0.0004,"stats":{"allcaps_rate":1.0,"boilerplate_rate":0.0,"duplicate_rate":0.8567426970788315,"emoji_rate":0.0,"len_max":5,"len_mean":5.0,"len_median":5.0,"len_min":5,"len_p95":5.0,"n_duplicates":8564,"n_empty":0,"one_word_rate":0.9998999599839936,"readability_flesch_mean":121.22000000000004,"url_rate":0.0,"vocab_size":1433,"word_mean":1.0001000400160065,"word_median":1.0}},{"alerts":[],"column":"issuing_agency","extras":{"singletons":1,"top_values":[["V",4416],["T",2131],["S",1946],["P",1325],["K",41],["N",38],["A",23],["Y",17],["M",13],["O",9],["C",9],["8",8],["3",6],["X",5],["9",3],["W",3],["L",2],["R",2],["F",2],["U",1]]},"kind":"categorical","n":10000,"n_null":0,"n_unique":20,"null_rate":0.0,"stats":{"cardinality":20,"entropy":2.0073162502379707,"entropy_ratio":0.46444924722660963,"top_rate":0.4416,"top_value":"V"}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","issue_date.top_rate","issue_date.top_value","violation_description.top_rate","violation_description.top_value","violation_description.null_rate","issuing_agency.top_rate","issuing_agency.top_value","vehicle_color.top_values","vehicle_make.top_values","violation_code.outlier_rate","violation_code.skew","street_name.allcaps_rate"],"featured_charts":[{"caption":"Check how dominant school-zone speed violations are versus all other categories.","column":"violation_description","kind":"bar"},{"caption":"See the concentration in agency 'V' and how the remaining agencies split the rest.","column":"issuing_agency","kind":"donut"},{"caption":"Look for duplicate color encodings (WH vs WHITE, BLK vs BLACK vs BK) signalling data-cleaning work.","column":"vehicle_color","kind":"bar"},{"caption":"Inspect the right-skewed distribution and the ~10% of values flagged as outliers.","column":"violation_code","kind":"histogram"},{"caption":"Confirm the expected long tail behind Honda and Toyota among 126 distinct makes.","column":"vehicle_make","kind":"bar"}],"model":"anthropic:claude-opus-4-7","narrative":"This is a 10,000-row sample of NYC-style parking violations with 9 columns covering summons IDs, issue dates and times, locations, violation codes/descriptions, issuing agencies, and vehicle make/color. Two things jump out: issue_date is heavily concentrated on a single day (2025-12-28 accounts for 65% of rows), and violation_description is dominated by 'PHTO SCHOOL ZN SPEED VIOLATION' at 52% of non-null values, paired with issuing_agency 'V' at 44% \u2014 suggesting the sample is skewed toward automated school-zone camera tickets. Vehicle_color also shows clear data-quality issues, with the same color appearing under multiple codes (e.g., WH/WHITE, BLK/BLACK/BK, GREY/GRY) that would need normalization before analysis. Violation_code is numeric with a ~10% outlier rate and right-skew, worth a look alongside the categorical description. Street_name is messy free text with 77% all-caps and many directional prefixes (SB, NB, WB, EB).","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.std","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Every one of the 10,000 rows carries a distinct value (n_unique = 10000, null_rate = 0.0), and the magnitudes (min 1.12e9, max 9.26e9) match the size of NYC parking summons numbers. The wide spread (std \u2248 2.71e9) and lack of outliers reflect identifier allocation rather than a measurable quantity. Despite being typed numeric, no arithmetic interpretation applies.","role":"identifier","scope":"column","target":"summons_number","treatment":"drop from modelling; retain only as a row key for joins."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This is an issue_date column stored as ISO datetime strings, treated here as categorical across 687 distinct days with no nulls. The distribution is severely concentrated: 65.42% of all 10000 rows fall on 2025-12-28, with another 1594 on 2025-12-30 and 356 on 2025-12-29, meaning roughly 85% of issuance clusters in late December 2025 before tapering into a long tail through 2026. Entropy ratio of 0.29 confirms the heavy skew, and the year-end spike looks like a backfill or batch-load artifact worth confirming before treating this as a true event date.","role":"timestamp","scope":"column","target":"issue_date","treatment":"Parse to datetime and bucket by month or week; investigate the 2025-12-28 spike before using as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.q1","stats.median","stats.q3","stats.iqr","stats.skew","stats.kurtosis","stats.outlier_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"This is almost certainly a categorical violation code stored as a number, with 62 distinct values across 10,000 rows and no nulls. Despite the numeric type, the distribution is meaningless as a quantity: values span 4 to 99, the IQR runs 21\u201336, and 10.07% of rows (1,007) flag as outliers under a numeric rule, with skew 1.51 and kurtosis 2.99. Median equals Q3 at 36, suggesting a heavy concentration at one or two dominant codes.","role":"feature","scope":"column","target":"violation_code","treatment":"Treat as categorical and one-hot or target-encode rather than using the raw integer."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column describing the parking/traffic violation issued, with 74 distinct codes across 10000 rows. It is heavily concentrated: 'PHTO SCHOOL ZN SPEED VIOLATION' alone covers 52.03% of records, with 'No Parking Street Cleaning' a distant second at 1428, yielding low entropy ratio 0.452. Note 15.13% of values are null, and the labels mix numeric-prefixed legal codes (e.g. '14-No Standing') with free-form descriptions like 'Fire Hydrant', some of which appear to duplicate the coded versions ('40-Fire Hydrant' vs 'Fire Hydrant').","role":"feature","scope":"column","target":"violation_description","treatment":"Normalise the coded vs free-text duplicates, then group rare categories before one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["alerts","n","n_unique","null_rate","stats.duplicate_rate","stats.allcaps_rate","stats.len_max","stats.len_p95","top_values","top_words","language_counts"],"model":"anthropic:claude-opus-4-7","narrative":"Street-name strings, mostly truncated NYC traffic-camera or incident locations like 'SB CROSS BAY BLVD @' with directional prefixes (sb/wb/nb/eb) and '@' delimiters dominating the top words. Values are heavily repeated (68.8% duplicate rate, only 3,115 uniques in 10,000 rows) and 77.3% are all-caps; lengths cap sharply at 20 characters, suggesting upstream truncation. Language detection flags ja (614) and zh (59) alongside 3,596 en, but this is almost certainly a false positive on short ALL-CAPS abbreviations rather than genuine multilingual content.","role":"feature","scope":"column","target":"street_name","treatment":"Normalise case, split off the directional prefix and the '@' cross-street, and treat as a categorical location feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","stats.cardinality","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical vehicle manufacturer codes, with HONDA leading at 13.4% of 9,922 non-null rows and TOYOT close behind at 1,302. Values appear truncated to 5 characters (TOYOT, NISSA, ME/BE, CHEVR, HYUND, SUBAR), which will fragment any join against full make names. Cardinality is 126 with entropy ratio 0.668, indicating a long but moderately concentrated tail, and nulls are negligible at 0.78%.","role":"feature","scope":"column","target":"vehicle_make","treatment":"Normalize the truncated codes to canonical make names, then target- or frequency-encode for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Vehicle color codes, but encoded inconsistently: short codes like GY (2079), BK (1784), WH (1579) coexist with verbose forms WHITE (347), BLACK (273), GREY (239), and alternate abbreviations BLK (275), GRY (167) for the same underlying colors. With 99 distinct values across 10000 rows and a 9.43% null rate, the cardinality is inflated by these duplicate encodings rather than true diversity. Entropy ratio of 0.55 reflects a heavy concentration in the gray/black/white tail.","role":"feature","scope":"column","target":"vehicle_color","treatment":"Normalize synonymous codes (e.g., BK/BLK/BLACK \u2192 black) before one-hot or target encoding."},{"confidence":"high","critiques":[],"evidence_keys":["stats.len_min","stats.len_max","stats.len_mean","stats.allcaps_rate","stats.one_word_rate","stats.duplicate_rate","n_unique","null_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column encodes time-of-day stamps in a compact HHMM+AM/PM format (e.g. '0839A', '1200P'), with every value exactly 5 characters and uppercase. Duplication is high (85.67%) across 1,432 unique stamps, which is expected for clock times sampled across 10,000 records. Null rate is negligible (0.0004) and there are no empty strings.","role":"timestamp","scope":"column","target":"violation_time","treatment":"Parse the HHMMa/p format into a proper time-of-day (minutes since midnight) before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Single-letter codes for the agency issuing each record, drawn from a closed set of 20 values with no nulls. Distribution is heavily concentrated: 'V' alone covers 44.16% (4,416/10,000) and the top four codes (V, T, S, P) account for the bulk of rows, while letters like K, N, A, Y, M, O appear fewer than 50 times each. Entropy ratio of 0.46 confirms the imbalance.","role":"feature","scope":"column","target":"issuing_agency","treatment":"One-hot encode the top categories and bucket the long tail into 'other' before modelling."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":3707,"prompt_tokens":13047,"total_tokens":16754}},"language_counts":{"ar":14,"ca":14,"cs":10,"da":1,"de":56,"en":3596,"es":86,"eu":5,"fr":39,"gl":1,"id":4,"it":21,"ja":614,"ko":14,"lt":1,"mk":1,"ms":1,"nl":25,"no":9,"pl":3,"pt":15,"ro":1,"ru":12,"sv":1,"te":1,"uk":8,"zh":59},"meta":{"generated_at":"2026-05-01T18:05:35+00:00","mode":"full","row_count":10000,"sampled_rows":10000,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/data/urban/parking_violations_sample.csv"},"notes":[],"saturn_version":"0.2.0","schema":{"issue_date":"categorical","issuing_agency":"categorical","street_name":"text","summons_number":"numeric","vehicle_color":"categorical","vehicle_make":"categorical","violation_code":"numeric","violation_description":"categorical","violation_time":"text"}}
