{"columns":[{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"brands_tags","extras":{},"kind":"unknown","n":77145,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"categories_tags","extras":{},"kind":"unknown","n":77145,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"countries_tags","extras":{},"kind":"unknown","n":77145,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"near_unique","level":"info","message":"100.0% of rows are unique strings"},{"code":"one_word","level":"warn","message":"100.0% rows are a single word"},{"code":"url_heavy","level":"info","message":"100.0% rows contain a URL"},{"code":"null_rate","level":"warn","message":"39.0% null"}],"column":"image_url","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[2,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,36226,0,10558,163,0,4,0,0,0,33,0,3,0,11,0,8,0,9,0,3,0,13,1],"edges":[75.0,75.525,76.05,76.575,77.1,77.625,78.15,78.675,79.2,79.725,80.25,80.775,81.3,81.825,82.35,82.875,83.4,83.925,84.45,84.975,85.5,86.025,86.55,87.075,87.6,88.125,88.65,89.175,89.7,90.225,90.75,91.275,91.8,92.325,92.85,93.375,93.9,94.425,94.95,95.475,96.0]},"near_unique":true,"sample":["https://images.openfoodfacts.org/images/products/323/624/007/0405/front_fr.115.400.jpg","https://images.openfoodfacts.org/images/products/007/739/787/8017/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/359/671/053/7884/front_fr.40.400.jpg","https://images.openfoodfacts.org/images/products/085/004/234/2022/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/942/101/808/0418/front_en.8.400.jpg","https://images.openfoodfacts.org/images/products/734/000/540/7118/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/004/126/814/0336/front_en.6.400.jpg","https://images.openfoodfacts.org/images/products/348/130/033/4021/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/002/795/814/3481/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/408/860/045/7420/front_en.15.400.jpg","https://images.openfoodfacts.org/images/products/081/074/503/1784/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/019/347/600/1463/front_en.7.400.jpg","https://images.openfoodfacts.org/images/products/235/037/300/4203/front_es.3.400.jpg","https://images.openfoodfacts.org/images/products/611/126/668/0388/front_fr.3.400.jpg","https://images.openfoodfacts.org/images/products/000/002/084/5858/front_en.12.400.jpg","https://images.openfoodfacts.org/images/products/000/002/068/2712/front_de.4.400.jpg","https://images.openfoodfacts.org/images/products/802/784/200/1738/front_it.11.400.jpg","https://images.openfoodfacts.org/images/products/074/639/543/3046/front_fr.3.400.jpg","https://images.openfoodfacts.org/images/products/502/125/491/0452/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/354/477/000/2767/front_fr.3.400.jpg","https://images.openfoodfacts.org/images/products/335/860/441/0006/front_fr.33.400.jpg","https://images.openfoodfacts.org/images/products/590/620/751/0074/front_pl.53.400.jpg","https://images.openfoodfacts.org/images/products/848/001/013/9204/front_es.26.400.jpg","https://images.openfoodfacts.org/images/products/590/082/002/0781/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/076/069/501/7201/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/023/992/001/2538/front_fr.3.400.jpg","https://images.openfoodfacts.org/images/products/408/870/002/8063/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/406/145/804/4479/front_de.3.400.jpg","https://images.openfoodfacts.org/images/products/731/086/500/8084/front_sv.15.400.jpg","https://images.openfoodfacts.org/images/products/027/184/610/5277/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/084/654/701/6261/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/003/575/131/8074/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/009/843/724/0953/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/480/021/613/0012/front_fr.3.400.jpg","https://images.openfoodfacts.org/images/products/409/920/001/8904/front_de.14.400.jpg","https://images.openfoodfacts.org/images/products/001/115/050/2078/front_en.8.400.jpg","https://images.openfoodfacts.org/images/products/880/115/572/9837/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/762/370/018/4622/front_fr.7.400.jpg","https://images.openfoodfacts.org/images/products/007/184/005/0814/front_en.16.400.jpg","https://images.openfoodfacts.org/images/products/002/654/205/7333/front_en.4.400.jpg","https://images.openfoodfacts.org/images/products/076/023/626/1407/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/022/159/810/5278/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/409/920/020/2020/front_fr.3.400.jpg","https://images.openfoodfacts.org/images/products/003/003/496/4245/front_en.16.400.jpg","https://images.openfoodfacts.org/images/products/021/974/102/8864/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/020/126/201/3405/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/505/478/170/1644/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/007/750/700/0109/front_en.3.400.jpg","https://images.openfoodfacts.org/images/products/800/163/725/9887/front_fr.4.400.jpg","https://images.openfoodfacts.org/images/products/005/974/999/5504/front_en.16.400.jpg"],"top_values":[],"top_words":[["https://images.openfoodfacts.org/images/products/809/507/300/522001927/front_es.3.400.jpg",2],["https://images.openfoodfacts.org/images/products/007/417/546/4271/front_en.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/001/800/042/6010/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/425/017/941/9615/front_de.5.400.jpg",1],["https://images.openfoodfacts.org/images/products/225/166/301/4103/front_fr.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/380/000/200/3904/front_bg.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/000/000/516/1577/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/359/671/052/7304/front_fr.35.400.jpg",1],["https://images.openfoodfacts.org/images/products/230/365/830/5793/front_en.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/239/060/030/1804/front_nb.8.400.jpg",1],["https://images.openfoodfacts.org/images/products/628/102/030/1030/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/405/648/948/2970/front_de.5.400.jpg",1],["https://images.openfoodfacts.org/images/products/761/326/921/4250/front_fr.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/318/633/9790/front_fr.11.400.jpg",1],["https://images.openfoodfacts.org/images/products/075/887/032/7313/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/323/107/013/0053/front_fr.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/007/789/047/4310/front_en.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/004/970/566/0485/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/539/069/576/9012/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/734/000/540/2564/front_sv.9.400.jpg",1],["https://images.openfoodfacts.org/images/products/801/266/650/4213/front_fr.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/000/000/211/9207/front_en.4.400.jpg",1],["https://images.openfoodfacts.org/images/products/376/031/537/3745/front_fr.5.400.jpg",1],["https://images.openfoodfacts.org/images/products/007/789/077/2003/front_en.3.400.jpg",1],["https://images.openfoodfacts.org/images/products/485/004/179/0127/front_en.3.400.jpg",1]],"vocab_skipped":null,"word_histogram":{"counts":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,47036,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"edges":[0.5,0.5333333333333333,0.5666666666666667,0.6,0.6333333333333333,0.6666666666666666,0.7,0.7333333333333334,0.7666666666666666,0.8,0.8333333333333333,0.8666666666666667,0.9,0.9333333333333333,0.9666666666666667,1.0,1.0333333333333332,1.0666666666666667,1.1,1.1333333333333333,1.1666666666666665,1.2,1.2333333333333334,1.2666666666666666,1.3,1.3333333333333335,1.3666666666666667,1.4,1.4333333333333333,1.4666666666666668,1.5]}},"kind":"text","n":77145,"n_null":30109,"n_unique":47035,"null_rate":0.39029101043489534,"stats":{"allcaps_rate":0.0,"boilerplate_rate":0.0,"duplicate_rate":2.1260311250956713e-05,"emoji_rate":0.0,"len_max":96,"len_mean":84.24347308444595,"len_median":84.0,"len_min":75,"len_p95":85.0,"n_duplicates":1,"n_empty":0,"one_word_rate":1.0,"readability_flesch_mean":-811.9179999999999,"url_rate":1.0,"vocab_size":19999,"word_mean":1.0,"word_median":1.0}},{"alerts":[{"code":"multilingual","level":"info","message":"31 languages detected in sample"},{"code":"null_rate","level":"warn","message":"41.9% null"},{"code":"duplicates","level":"warn","message":"31.0% duplicate strings"}],"column":"ingredients_text","extras":{"language_counts":{"__engine":"fasttext:2,197","ar":1,"bg":8,"ca":2,"cs":11,"da":6,"de":128,"el":3,"en":1623,"es":37,"et":1,"fi":8,"fr":212,"hr":5,"hu":4,"it":22,"ja":2,"ko":1,"lt":2,"nl":18,"no":18,"pl":28,"pt":13,"ro":2,"ru":9,"sh":2,"sr":2,"sv":23,"th":1,"tr":2,"uk":2},"language_sample_size":5000,"length_histogram":{"counts":[22912,8740,4217,3155,1952,1268,810,581,378,282,173,115,57,38,37,29,29,7,12,5,3,1,3,2,0,0,1,0,1,1,0,0,0,0,0,1,0,0,0,1],"edges":[0.0,132.075,264.15,396.22499999999997,528.3,660.375,792.4499999999999,924.5249999999999,1056.6,1188.675,1320.75,1452.8249999999998,1584.8999999999999,1716.975,1849.0499999999997,1981.1249999999998,2113.2,2245.2749999999996,2377.35,2509.4249999999997,2641.5,2773.575,2905.6499999999996,3037.725,3169.7999999999997,3301.8749999999995,3433.95,3566.0249999999996,3698.0999999999995,3830.1749999999997,3962.2499999999995,4094.325,4226.4,4358.474999999999,4490.549999999999,4622.625,4754.7,4886.775,5018.849999999999,5150.924999999999,5283.0]},"near_unique":false,"sample":["LAIT 67% issu d'animaux nourris sans OGM (< 0,9%) et CR\u00c8ME 26% pasteuris\u00e9s (Origine : France), ferments LACTIQUES, ail et fines herbes (1.9%), sel, poivre, conservateur : sorbate de potassium. Peut contenir des traces de fruits \u00e0 coque.","Corn meal, vegetable oil (contains one or more of the following: corn, cottonseed, palm, sunflower), cheese blend (maltodextrin, whey, sunflower oil, cheddar cheese [pasteurized milk, cheese culture, salt, enzymes], salt, monosodium glutamate, sodium phosphate, butter [cream, salt], natural flavor, citric acid, lactic acid, yellow 5, yellow 6, enzymes), seasoning (maltodextrin, cheddar cheese [(cultured milk, salt, enzymes), whey, buttermilk, salt, natural flavor, disodium phosphate, lactic acid], whey, spices, onion powder, natural flavors, garlic powder, salt, yeast extract, dehydrated red bell pepper, sodium diacetate, jalapeno pepper powder, malic acid, extractives of paprika [color]), salt.","provolone piccante cheese (milk) (64%), smoked prosciutto (36%) [pork, salt, spices and herbs, sugar, dextrose, preservative (sodium nitrite), antioxidant (sodium ascorbate)]. *made with 103g of pork per 100g of finished product. allergy advice! for allergens, see ingredients in bold. packaged in a protective atmosphere nutrition we suggest this product provides 8 servings typical values per","","ROMANO CHEESE MADE FROM SHEEP'S MILK, CHEESE CULTURE, SALT, ENZYMES, POWDERED CELLULOSE ADDED TO PREVENT CAKING.","Cheddar Cheese (Pasteurized Milk, Cheese Culture, Salt, Enzymes), Whey, Milk Protein Concentrate, Milkfat, Whey Protein Concentrate, Sodium Phosphate, Contains Less Than 2% Of Calcium Phosphate, Salt, Sodium Alginate, Lactic Acid, Sorbic Acid As A Preservative, Apocarotenal (Color), Annatto (Color).","Pasteurized reduced fat milk, cheese culture, salt, enzymes, annatto (vegetable color), vitamin a palmitate.","undefined","cheese whey, water, vegetable oil (canola oil and/or soybean oil and/or sunflower oil), modified corn starch, natural flavours, salt, malto - dextrin, jalapeno peppers, white vinegar, monoso - dium glutamate, cheddar cheese (pasteurized milk, cheese cultures, salt, enzymes), disodium phos - phate, datem, mono - and di-glycerides, acetic acid, colour, contains: milk, huilo","_Leite_ pasteurizado, _nata_ pasteurizada, reguladores de acidez (fosfato diss\u00f3dico, citrato triss\u00f3dico e \u00e1cido c\u00edtrico), amido modificado, estabilizadores (pectina, \u00e1gar-\u00e1gar, carragenina, farinha de sementes de alfarroba e goma de tara), antiaglomerantes (fosfato tric\u00e1lcico e fosfato dic\u00e1lcico), sal, fermentos l\u00e1cteos.","Broccoli, cheese sauce (water, whey, modified corn.starch, cheddar cheese [pasteurized milk, cheese culture, salt, enzymes], contains less than 2% of annatto (vegetable color), citric acid, corn oil, corn syrup acids, creams, disodium guanylate, disodium inosinate, dry vegetable shortening, garlic powder, granular, semisoft, blue cheese [pasteurized milk, cheese culture, salt, enzymes], maltodextrin, onion powder, palm oil, paprika (color), salt, sodium alginate, sodium phosphate, spice, sugar, swiss cheese [pasteurized milk, cheese culture, salt enzymes], unsalted butter [pasteurized cream, natural flavorings], yeast extract).","Sesame seed bun: enriched bleached wheat flour (wheat flour, niacin, reduced iron, thiamine mononitrate, riboflavin, folic acid, enzyme), water, sugar, soybean oil, sesame seeds, contains 2% or less of: yeast (yeast, sorbitan monostearate, ascorbic acid), salt, monoglycerides with ascorbic acid and citric acid (antioxidants), calcium propionate (preservative), calcium sulfate, enzymes, wheat starch, ascorbic acid. fully cooked flame broiled chopped beef steak (smoke flavor added): beef, salt, potassium phosphate, maltodextrin (from corn), modified corn starch, spice, grill flavor (partially hydrogenated soybean/cottonseed oil), corn syrup solids, natural smoke flavor. pasteurized process american cheese: cultured milk, water, cream, sodium citrate, salt, sodium phosphate, sorbic acid (preservative), lactic acid, artificial color, enzymes, soy lecithin.","Flour tortilla (wheat flour, water, whole wheat flour, palm oil, baking powder, cane sugar, salt, guar gum, non-gmo corn starch), cage-free* egg whites (egg whites, whole milk, non-gmo corn starch, sea salt, pepper), chicken apple sausage (skinless chicken thigh, dehydrated apples, water, salt, brown sugar, less than 2% of: spices, flavorings, granulated garlic, natural smoke flavor), white cheddar cheese (pasteurized cultured milk, salt, enzymes), organic white cheddar cheese sauce (water, organic corn starch, salt, organic cane sugar, organic natural cheddar cheese flavor, and 2% or less organic canola oil), organic roasted russet potatoes (organic potatoes with organic olive oil), organic salsa (organic diced tomatoes [organic tomatoes, organic tomato juice, sea salt, naturally derived citric acid, calcium chloride], organic diced onions, organic jalapeno peppers, organic vinegar, organic lime juice, organic scallions, organic cilantro, organic corn starch, sea salt, organic garlic powder, organic cumin, organic black pepper, organic coriander, organic chili powder), organic red peppers, organic scallions, organic corn starch.","skimmed cheese, milk fat, milk proteins, emulsifying salts (E331, E452), salt, preservative (E202)","","63% krumpir, 31% suncokretovo ulje, maltodekstrin, kuhinjska sol, dekstroza, poja\u010diva\u010di arome: mononatrijev glutaminat, dinatrijev guanilat, dinatrijev inozinat, dijatrijevi 5'-ribonukleotidi; sirutka u prahu, arome, 0,2% sir u prahu, mlijeko u prahu, 0,2% luk u prahu, jogurt u prahu, \u0161e\u0107er, \u010de\u0161njak u prahu, regulatori kiselosti: mlije\u010dna kiselina, jabu\u010dna kiselina, limunska kiselina; bojilo: ekstrakt paprike. Mo\u017ee sadr\u017eavati tragove kikirikija, soje i glutena (p\u0161enica).","unbleached wheat flour, enriched flour (wheat flour, niacin, reduced iron, thiamine mononitrate, riboflavin, folic acid), safflower oil, corn starch, palm oil, leavening (baking soda, monocalcium phosphate, ammonium bicarbonate), yeast extract, sunflower lecithin, cane sugar onion powder, garlic powder, lactic acid, calcium lactate, salt, distilled vinegar solids, annatto extract (for color), organic maltodextrin, natural flavor, contains wheat made on the same equipment that processes milk and soy,","","Raclette 49% (_lait_** pasteuris\u00e9 de vache, sel, ferments lactiques (contient _lait_), coagulant microbien, conservateur : natamycine), gouda 49% (_lait_** pasteuris\u00e9 de vache, sel, ferments lactiques (contient _lait_), coagulant microbien), f\u00e9cule de pomme de terre. **Lait origine France.","Romaine lettuce, sweet onion vinaigrette (canola oil, high fructose corn syrup, water, dijon mustard [water, mustard seed, distilled vinegar, salt, white wine, citric acid, turmeric {color}, tartaric acid, spices], onion, red wine vinegar, white wine vinegar, sweet onion [sweet onion, vinegar, salt], salt, lemon juice concentrate, dried onion, spices, xanthan gum, natural smoke flavor), chicken breast (boneless chicken breast, water, contains 2% or less of the following: soy protein concentrate, sodium lactate, salt, modified corn starch, carrageenan, sodium phosphate [preservative]), apples (apples and calcium ascorbate [vitamin c calcium salt]), croutons (enriched flour [wheat flour, malted barley flour, niacin, reduced iron, thiamin mononitrate, riboflavin, folic acid], canola and/or sunflower oil, whey, salt, yeast, 2% or less of high fructose corn syrup, dehydrated parsley, garlic powder, calcium propionate [preservative], natural and artificial flavor, parmesan cheese and enzyme modified cheese [pasteurized milk, cheese cultures, salt, enzymes], cultured nonfat milk, annatto [color], extractives of turmeric and paprika [color], enzymes, ascorbic acid, tbhq [to preserve freshness]), blue cheese crumbles (blue cheese [pasteurized milk, cheese cultures, salt, enzymes, penicillium roquefortii], powdered cellulose [to prevent caking], natamycin [to protect flavor]), radicchio, red onion, carrot, green leaf lettuce.","Pasteurisierte Kuhmilch*, Speisesalz, K\u00e4sereikulturen, mikrobielles Lab. *aus kontrolliert biologischer Landwirtschaft","Wheat Flour [Wheat Flour, Calcium Carbonate, Iron, Niacin, Thiamin)], Mature Cheddar Cheese (with Colour: Annatto) (Milk) (22%), Water, Tomato, Rapeseed Oil, Cornflour, White Wine Vinegar, Pasteurised Egg Yolk, Salt, Yeast, Emulsifiers (Mono - and Di-Glycerides of Fatty Acids, Mono - and Di-Acetyl Tartaric Acid Esters of Mono - and Di-Glycerides of Fatty Acids), Spirit Vinegar, Wheat Gluten, Soya Flour, Mustard Flour, Palm Oil, Flour Treatment Agent (Ascorbic Acid). Cheese and onion: INGREDIENTS Wheat Flour [Wheat Flour, Calcium Carbonate, Iron, Niacin, Thiamin], Water, Mature Cheddar Cheese (Milk) (12%), Red Leicester Cheese (with Colour: Annatto) (Milk) (12%), Onion, Rapeseed Oil, Oatmeal, Oats, Wheat Bran, Cornflour, Full Fat Soft Cheese [Cheese (Milk), Cornflour], White Wine Vinegar, Pasteurised Egg Yolk, Salt, Yeast, Wheat Gluten, Spirit Vinegar, Emulsifiers (Mono - and Di-Glycerides of Fatty Acids, Mono - and Di-Acetyl Tartaric Acid Esters of Mono-and Di-Glycerides of Fatty Acids), Muscovado Sugar, Mustard Flour, Malted Barley Flour, Palm Oil, Flour Treatment Agent (Ascorbic Acid). Cheese and pickle: INGREDIENTS Wheat Flour [Wheat Flour, Calcium Carbonate, Iron, Niacin, Thiamin), Mature Cheddar Cheese (Milk) (28%), Water, Oatmeal, Oats, Sugar, Malt Vinegar (Barley), Carrot, Courgette, Onion, Swede, Wheat Bran, Molasses, Salt, Yeast, Cornflour, Spirit Vinegar, Wheat Gluten, Emulsifiers (Mono - and Di-Glycerides of Fatty Acids, Mono - and Di-Acetyl Tartaric Acid Esters of Mono - and Di-Glycerides of Fatty Acids), Muscovado Sugar, Rapeseed Oil, Malted Barley Flour, Spices, Barley Malt Extract, Concentrated Lemon Juice, Palm Oil, Flour Treatment Agent (Ascorbic Acid), Black Pepper. Allergy Advice For allergens, including cereals containing gluten, see ingredients in bold. The allergens in this product have changed. Suitable for vegetarians. STORAGE Keep refrigerated. NUTRITION","TAPIOCA FLOUR, MILK (MILK, VITAMIN D3), PARMESAN CHEESE (CULTURED PASTEURIZED MILK, SALT, MICROBIAL ENZYMES), CANOLA OIL, EGG, WATER, SEA SALT, WHITE PEPPER.","skummet melk, fl\u00f8te, melkesyrekultur, salt, konserveringsmiddel (kaliumsorbat), l\u00f8pe (mikrobiell)","Cultured milk, enzymes, salt.","Fresh mozzarella: pasteurized milk & cream, vinegar, vegetable enzymes, salt. balsamic dip: concentrated grape juice, balsamic vinegar of modena 35% (wine vinegar, concentrated grape must, caramel color), modified corn starch. caramel color contains sulphites.","Filling: cheddar cheese, mozzarella cheese, green chilies (salt, citric acid, calcium chloride), cheese sauce (modified food starch, maltodextrin, sweet whey powder, salt, natural cheddar cheese flavor, non fat dry milk, natural butter flavor, partially hydrogenated soybean oil, autolyzed yeast extract, yellow #5, yellow #6 lake.) tortilla: wheat enriched flour (flour, niacin, iron, thiamin mononitrate, riboflavin, folic acid), water, vegetable shortening (partially hydrogenated soybean and cotton seed oil), salt, leavening, (sodium bicarbonate, sodium aluminum sulfate, sodium acid pyrophosphate, monocalcium phosphate, sodium aluminum phosphate), xanthan, guar gum, fumaric acid, calcium propionate, l-cysteine hydrochloride.","PASTEURIZED MILK, CHEESE CULTURES, SALT, MICROBIAL RENNET.","","Enriched Corn Meal (Corn Meal, Ferrous Sulfate, Niacin, Thiamin Mononitrate, Riboflavin, Folic Acid), Vegetable Oil (Sunflower, Corn, And/Or Canola Oil), White Cheddar Seasoning (Whey, Cheddar Cheese [Milk, Cheese Cultures, Salt, Enzymes], Canola Oil, Natural And Artificial Flavors, Maltodextrin [Made From Corn], Artificial Color, Salt, Whey Protein Concentrate, Monosodium Glutamate, Lactic Acid, Citric Acid, Acetic Acid), And Salt.","Unbleached enriched flour (wheat flour, malted barley flour, niacin, reduced iron, thiamine mononitrate, riboflavin, folic acid), water, durum flour, semolina, roasted garlic, medium asiago cheese (pasteurized milk, cheese culture, salt, enzymes), asiago fresh cheese (pasteurized milk, cheese culture, salt, enzymes), romano cheese (pasteurized cow's milk, salt, cheese culture, enzymes), salt, parmesan cheese (milk, salt, cheese culture, enzymes), sour culture, maltodextrin, whey, yeast, white degerminated corn meal, olive oil natural flavors, black pepper, ascorbic acid (added as a dough conditioner).","Pasta: wheat flour, water, eggs, beta-carotene. filling: asiago cheese (pasteurized cows milk, cheese cultures, salt, enzymes), ricotta cheese (whey, protein, salt, vinegar), mozzarella cheese (pasteurized whole milk, culture, salt, enzymes), breadcrumbs (wheat flour), parmesan cheese (pasteurized cows milk, cheese culture, salt, enzymes), romano cheese (pasteurized cows milk, cheese culture, salt, enzymes), parmesan flavor (parmesan cheese [paseurized milk, cultures, salt, enzymes], salt, yeast extract, unsalted butter, corn oil, olive oil, cream powder, sugar, natural flavorings), canola oil, parsley, salt, black pepper.","Pasteurized whole milk, salt, enzymes & select cultures","PASTEURIZED MILK AND CREAM, WATER, WHEY PROTEIN CONCENTRATE, MODIFIED CORN STARCH, GARLIC*, SALT, CHEESE CULTURE, SPICE, LACTIC ACID, GUAR GUM, PARSLEY, POTASSIUM SORBATE (PRESERVATIVE), CHIVES, CAROB BEAN GUM, XANTHAN GUM, NATURAL FLAVOR, ENZYMES. *DRIED.","Gepasteuriseerde melk, zout, zuursel (melk), vegetarisch stremsel.","Cultured pasteurized skim milk, pineapple, whey, whey protein concentrate, salt, maltodextrin, modified corn starch, aspartame*, artificial color, natural flavor, guar gum, carrageenan, locust bean gum, sodium citrate, citric acid, potassium sorbate and carbon dioxide (to preserve freshness), vitamin a palmitate and enzyme.","undefined","Aged cheddar cheese (milk, cultures, salt, enzymes), natural smoke flavor, sodium phosphate, potassium sorbate to preserve freshness.","Crust: enriched flour (wheat flour, malted barley flour, niacin, ferrous sulfate, thiamine mononitrate, riboflavin, folic acid), water, soybean oil, sugar, yeast, salt, baking powder (cornstarch, sodium bicarbonate, sodium aluminum sulfate, monocalcium phosphate), degerminated yellow cornmeal, soy flour. sauce: water, tomato paste (tomatoes), seasoning blend (modified cornstarch, salt, dehydrated onion, dehydrated garlic, sugar, spice, soybean oil, contains less than 2% guar gum, parmesan cheese [cultured milk, salt, enzymes], xanthan gum, paprika, citric acid, beet powder [color], soy flour), sugar, modified food starch. mozzarella cheese blend: low moisture part-skim mozzarella cheese (pasteurized milk, cultures, salt, enzymes), mozzarella cheese substitute (water, corn oil, nonfat dry milk, modified food starch, potassium chloride, sodium citrate, sodium aluminum phosphate, sodium tripolyphosphate, tri-calcium phosphate, magnesium oxide, ferric-ortho-phosphate, vitamin a palmitate, niacinamide, zinc oxide, cyanocobalamin, pyridoxine hydrochloride [vitamin b6]).","Tapioca starch, cheese (pasteurized milk, cheese cultures, salt, enzymes), milk, canola oil, eggs, cornstarch, sodium bicarbonate, sodium acid pyrophospate, monocalcium phosphate, salt, garlic","cheddarcheese (cultured pasteurized milk, salt, enzymes, annatto [vegetable color]). anti-caking blend (potato starch, tapioca starch, 0 inhibitor]). contains: milk stributed by: lipari fo arren mi48089 265-9853 liparifoods.com","undefined","Pasteurized sheep's milk, salt, cheese cultures, enzymes.","undefined","undefined","Nonfat Mozzarella Cheese (Pasteurized Skim Milk, Cheese Culture, Salt, Enzymes, Yeast*, Artificial Color, Vitamin A Palmitate); Potato Starch, Cellulose Powder And Calcium Sulfate Added To Prevent Caking; Natamycin (A Natural Mold Inhibitor)","_Leite_ de b\u00fafala (Origem: It\u00e1lia), sal, coalho, penicilium.","PASTEURIZED MILK, CHEESE CULTURE SALT, ENZYMES, POTATO STARCH, CORN STARCH AND CALCIUM SULFATE ADDED TO PREVENT CAKING. NATAMYCIN (MOLD INHIBITOR).","Pasteurized milk, cheese culture, salt, enzymes, annatto color.","Cultured pasteurized milk, salt, enzymes, annatto coloring if colored."],"top_values":[["",4981],["undefined",2553],["Pasteurized milk, cheese culture, salt, enzymes, annatto (vegetable color).",215],["Pasteurized milk, cheese culture, salt, enzymes.",184],["Pasteurized part-skim milk, cheese culture, salt, enzymes.",153],["Pasteurized milk, cheese culture, salt, enzymes, annatto color.",116],["Pasteurized milk, cheese culture, salt, enzymes and annatto (vegetable color).",115],["Pasteurized milk, cheese cultures, salt, enzymes.",103],["Cultured pasteurized milk, salt, enzymes.",89],["Pasteurized milk, cheese culture, salt, enzymes, annatto (color).",60],["Cultured milk, salt, enzymes.",51],["Cultured pasteurized milk, salt, enzymes, annatto color.",51],["Pasteurized milk, vinegar, salt, enzymes.",45],["PASTEURIZED MILK, CHEESE CULTURE, SALT, ENZYMES.",42],["Pasteurized part-skim milk, cheese culture, salt and enzymes.",40],["Cultured pasteurized milk, salt, enzymes, color added.",37],["Pasteurized milk and cream, cheese culture, salt, stabilizers (carob bean and/or xanthan and/or guar gums).",36],["PASTEURIZED MILK, CHEESE CULTURE, SALT, ENZYMES, ANNATTO (VEGETABLE COLOR).",36],["Pasteurized milk, jalapeno peppers, cheese culture, salt, enzymes.",34],["PASTEURIZED MILK, CHEESE CULTURE, SALT, ENZYMES AND ANNATTO (VEGETABLE COLOR).",34]],"top_words":[["salt,",17784],["cheese",17217],["milk,",12323],["de",6512],["and",6409],["pasteurized",5704],["water,",4885],["culture,",4708],["oil,",4401],["sodium",4147],["flour,",4033],["natural",3882],["starch,",3624],["cheddar",3355],["cultures,",3352],["acid,",3320],["enzymes),",3242],["(pasteurized",3231],["enzymes,",3190],["corn",3036],["organic",2878],["wheat",2836],["gum,",2736],["milk",2731],["sugar,",2713]],"vocab_skipped":null,"word_histogram":{"counts":[25723,8419,4253,2562,1496,893,548,391,215,105,59,45,44,17,13,11,4,5,2,1,0,0,1,2,0,0,0,1,0,1],"edges":[1.0,22.833333333333332,44.666666666666664,66.5,88.33333333333333,110.16666666666666,132.0,153.83333333333331,175.66666666666666,197.5,219.33333333333331,241.16666666666666,263.0,284.8333333333333,306.66666666666663,328.5,350.3333333333333,372.16666666666663,394.0,415.8333333333333,437.66666666666663,459.5,481.3333333333333,503.16666666666663,525.0,546.8333333333333,568.6666666666666,590.5,612.3333333333333,634.1666666666666,656.0]}},"kind":"text","n":77145,"n_null":32334,"n_unique":30902,"null_rate":0.41913280186661483,"stats":{"allcaps_rate":0.08564861306375667,"boilerplate_rate":0.0,"duplicate_rate":0.3103925375465845,"emoji_rate":0.000223159492088996,"len_max":5283,"len_mean":238.2221552743746,"len_median":126.0,"len_min":0,"len_p95":842.0,"n_duplicates":13909,"n_empty":4981,"one_word_rate":0.1732610296578965,"readability_flesch_mean":16.005968190833443,"url_rate":0.002298542768516659,"vocab_size":35093,"word_mean":31.63863783446029,"word_median":16.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"labels_tags","extras":{},"kind":"unknown","n":77145,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutrition_grades_tags","extras":{},"kind":"unknown","n":77145,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"origins_tags","extras":{},"kind":"unknown","n":77145,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"multilingual","level":"info","message":"31 languages detected in sample"},{"code":"duplicates","level":"warn","message":"30.9% duplicate strings"}],"column":"product_name","extras":{"language_counts":{"__engine":"fasttext:4,813","bs":3,"ca":13,"ceb":4,"cs":7,"da":4,"de":169,"el":5,"en":3820,"eo":4,"es":114,"et":5,"fi":12,"fr":315,"hu":2,"id":4,"it":163,"ja":11,"ms":5,"nl":34,"nn":2,"no":4,"pl":21,"pt":20,"ro":4,"ru":17,"sk":3,"sv":8,"tr":13,"uk":6,"zh":3},"language_sample_size":5000,"length_histogram":{"counts":[1658,7931,16585,15617,12097,8979,4569,2949,2054,1107,796,562,297,201,135,105,99,96,63,70,54,56,49,35,37,30,13,22,11,12,15,10,4,5,5,4,2,2,1,3],"edges":[0.0,6.35,12.7,19.049999999999997,25.4,31.75,38.099999999999994,44.449999999999996,50.8,57.15,63.5,69.85,76.19999999999999,82.55,88.89999999999999,95.25,101.6,107.94999999999999,114.3,120.64999999999999,127.0,133.35,139.7,146.04999999999998,152.39999999999998,158.75,165.1,171.45,177.79999999999998,184.14999999999998,190.5,196.85,203.2,209.54999999999998,215.89999999999998,222.25,228.6,234.95,241.29999999999998,247.64999999999998,254.0]},"near_unique":false,"sample":["Cream Cheese","Queso Cottage proteico","Tim Hortons, Bacon, Egg White & Cheese On Maple Flatbread","Butter Cream Cheese Danish","Macaroni & cheese dinner","Parmesan And Breadcrumb Topped Macaroni And Cheese","Mazdamer","Cheddar Cheese w/ Scotch Bonnet Chili and Red Peppers","Old-fashioned cheese & onion potato chips","doritos tangy cheese","hellers bacon & cheese sausages","Flavored cream cheese, salted caramel","Popcorn Cheddar Cheese Taste","K\u00f6rniger Frischk\u00e4se","Macaroni Cheese Dinner","\u30ab\u30de\u30f3\u30d9\u30fc\u30eb\u30c1\u30fc\u30ba","Maasdam en tranches","Gruy\u00e8re","Pretzel Cheese Bun","Basil pesto parmesan crisps","Spring Haven Farms, Grated Romano Cheese","Provolone valpadana piccante","Black Bomber","Twisties Fromage Cheese","Big cheese pepper jack cheese","Fettine di formaggio fuso","Grated Romano Cheese","Kiri","Bio Groovier","Cheeseburger Mac and Cheese","Gouda 48+ cheese","Swiss Cheese","Colby cheese","The two layered cheese","Organic White Cheddar Macaroni & Cheese","Fromage frais ferme de lesneum","Goudse kaas 48+ overjarig","Hatch chile queso dip","Potato crisps, cheddar cheese","Canada fresca","Smoked Gouda Cheese","Grill- und Pfannenk\u00e4se","Kremost Naturell","Salad Chicken (Deluxe Finger - Triple Cheese Radish Dip)","Cheese - Jong belegen","Cotswold Double Gloucester Cheese","Harris teeter, fresh foods market, three cheese & spinach ravioli","Farmer Style Fresh Cheese","","Chicken Kiev with a Creamy Cheese & Paprika Filling in a Taco Panade Breadcrumb"],"top_values":[["Cottage Cheese",366],["",349],["Cottage cheese",345],["Cheese",328],["Mozzarella",269],["Cream Cheese",177],["Cream cheese",170],["Sharp Cheddar Cheese",151],["Mozzarella Cheese",142],["Swiss Cheese",129],["Mozzarella cheese",123],["Cheddar Cheese",119],["Mascarpone",117],["Pepper Jack Cheese",116],["Cheddar cheese",111],["Parmesan Cheese",110],["Mild Cheddar Cheese",110],["Gouda",108],["Fromage",104],["Macaroni & Cheese",103]],"top_words":[["cheese",13869],["&",2632],["cheddar",2257],["and",1218],["with",1073],["cream",898],["mozzarella",884],["cheese,",811],["jack",761],["cottage",630],["shredded",590],["pizza",553],["sharp",480],["white",476],["de",454],["mac",453],["queso",422],["macaroni",422],["parmesan",417],["gouda",404],["fromage",387],["natural",370],["style",366],["mild",355],["pepper",335]],"vocab_skipped":null,"word_histogram":{"counts":[18418,16822,14563,10071,9858,2116,1290,848,1055,285,201,122,186,88,70,60,56,71,28,31,19,32,14,7,7,10,3,4,1,4],"edges":[1.0,2.2333333333333334,3.466666666666667,4.7,5.933333333333334,7.166666666666667,8.4,9.633333333333333,10.866666666666667,12.100000000000001,13.333333333333334,14.566666666666666,15.8,17.033333333333335,18.266666666666666,19.5,20.733333333333334,21.96666666666667,23.200000000000003,24.433333333333334,25.666666666666668,26.900000000000002,28.133333333333333,29.366666666666667,30.6,31.833333333333336,33.06666666666667,34.300000000000004,35.53333333333333,36.766666666666666,38.0]}},"kind":"text","n":77145,"n_null":805,"n_unique":52776,"null_rate":0.010434895326981658,"stats":{"allcaps_rate":0.013466072832067069,"boilerplate_rate":0.0,"duplicate_rate":0.30867173172648676,"emoji_rate":0.00035368090123133353,"len_max":254,"len_mean":27.748952056588944,"len_median":24.0,"len_min":0,"len_p95":58.0,"n_duplicates":23564,"n_empty":349,"one_word_rate":0.059457689284778625,"readability_flesch_mean":63.62454960039961,"url_rate":0.0,"vocab_size":8852,"word_mean":4.2694262509824465,"word_median":4.0}},{"alerts":[{"code":"one_word","level":"warn","message":"29.7% rows are a single word"},{"code":"null_rate","level":"warn","message":"57.7% null"},{"code":"short_text","level":"info","message":"95th-percentile length under 20 chars"},{"code":"duplicates","level":"warn","message":"90.5% duplicate strings"}],"column":"quantity","extras":{"language_counts":{},"language_sample_size":5000,"length_histogram":{"counts":[4393,66,10984,12621,1264,413,462,129,1845,80,51,142,49,48,14,21,4,13,3,5,8,5,4,0,3,1,1,2,6,1,1,1,0,1,0,0,0,0,0,1],"edges":[0.0,1.45,2.9,4.35,5.8,7.25,8.7,10.15,11.6,13.049999999999999,14.5,15.95,17.4,18.849999999999998,20.3,21.75,23.2,24.65,26.099999999999998,27.55,29.0,30.45,31.9,33.35,34.8,36.25,37.699999999999996,39.15,40.6,42.05,43.5,44.949999999999996,46.4,47.85,49.3,50.75,52.199999999999996,53.65,55.1,56.55,58.0]},"near_unique":false,"sample":["165g","Fully Loaded MAC & CHEESE 100g","1 serving(s)","150 g","110 g","8 oz","","1 serving(s)","5kg","125 g","8 oz","99 g","105g (3x35g)","125 g","180 g","261 g","","","60g","300 g","8 oz","150 gr (6x25gr)","200 g","150 g","","8 oz","28 g","185 g","200 g","150g","","100 g","","300 g","200g","150 g","1 serving(s)","19 g","100 g","28 g","142 g","1 fl oz","250 g","1 serving(s)","24 oz/680 g","32 oz","1","220","100 g","113 g"],"top_values":[["",4252],["1 serving(s)",1576],["8 oz",1477],["200 g",1469],["28 g",1123],["150 g",1111],["250 g",992],["200g",696],["16 oz",524],["100 g",483],["150g",467],["6 oz",447],["12 oz",443],["250g",437],["125 g",430],["400 g",430],["500 g",415],["300 g",391],["7 oz",283],["10 oz",256]],"top_words":[["g",8539],["oz",3528],["1",1255],["8",1000],["serving(s)",985],["200",980],["150",714],["28",688],["250",673],["200g",454],["kg",442],["100",361],["16",345],["x",342],["6",340],["400",317],["12",315],["125",311],["150g",307],["500",285],["250g",284],["300",249],["10",216],["4",208],["7",208]],"vocab_skipped":null,"word_histogram":{"counts":[9710,0,21501,0,549,0,619,0,57,0,158,0,26,0,12,0,5,0,2,0,2,0,0,0,0,0,0,0,0,1],"edges":[1.0,1.5,2.0,2.5,3.0,3.5,4.0,4.5,5.0,5.5,6.0,6.5,7.0,7.5,8.0,8.5,9.0,9.5,10.0,10.5,11.0,11.5,12.0,12.5,13.0,13.5,14.0,14.5,15.0,15.5,16.0]}},"kind":"text","n":77145,"n_null":44503,"n_unique":3102,"null_rate":0.5768747164430618,"stats":{"allcaps_rate":0.010416028429630537,"boilerplate_rate":0.0,"duplicate_rate":0.9049690582684885,"emoji_rate":0.0,"len_max":58,"len_mean":4.739691195392439,"len_median":5.0,"len_min":0,"len_p95":12.0,"n_duplicates":29540,"n_empty":4252,"one_word_rate":0.2974695177991545,"readability_flesch_mean":102.593225,"url_rate":0.0,"vocab_size":1802,"word_mean":1.790607193186692,"word_median":2.0}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["row_count","column_count","columns.quantity.null_rate","columns.quantity.stats.duplicate_rate","columns.quantity.top_values","columns.ingredients_text.null_rate","columns.ingredients_text.language_counts","columns.product_name.language_counts","columns.product_name.top_values","columns.product_name.stats.duplicate_rate","columns.image_url.null_rate"],"featured_charts":[{"caption":"Most common quantity strings \u2014 note inconsistent formatting like '200 g' vs '200g' that will need normalization.","column":"quantity","kind":"bar"},{"caption":"Top product names are dominated by generic terms like 'Cottage Cheese' and 'Mozzarella', suggesting many non-unique entries.","column":"product_name","kind":"bar"},{"caption":"Ingredient text length is highly skewed (median 126 chars, max 5,283) \u2014 useful for spotting sparse vs. detailed entries.","column":"ingredients_text","kind":"length"},{"caption":"Product name length distribution shows most names are short (median 24 chars), with a long tail of verbose entries.","column":"product_name","kind":"length"}],"model":"anthropic:claude-opus-4-7","narrative":"This dataset contains 77,145 product records from Open Food Facts, focused on cheese products, with 10 columns covering names, ingredients, quantities, image URLs, and several tag fields (brands, categories, countries, labels, nutrition grades, origins). The text fields are highly multilingual \u2014 product_name spans 30+ languages with English (3,820) and French (315) dominating, and ingredients_text shows the same pattern. Two things deserve a closer look first: the heavy null rates on quantity (57.7%) and ingredients_text (41.9%), which will limit any analysis depending on those fields, and the strong duplication in quantity (90.5% duplicate rate) where values like '1 serving(s)', '8 oz', and '200 g' recur thousands of times. Product names also duplicate substantially (30.9%), with 'Cottage Cheese', 'Cheese', and 'Mozzarella' appearing as common generic labels. Note that the six tag-style columns were skipped during profiling, so their structure is not yet characterized.","scope":"dataset","target":"__global__"},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"The column brands_tags was skipped by the profiler, so no descriptive statistics, uniqueness count, or value samples are available. The only confirmed facts are that it has 77145 rows and a null_rate of 0.0, meaning every row carries some value. Based on the name alone it likely holds brand tag strings, but without evidence this is not verified.","role":"other","scope":"column","target":"brands_tags","treatment":"Re-run profiling with string handling enabled before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics, uniqueness, or value samples are available beyond a row count of 77145 and a null rate of 0.0. The name `categories_tags` suggests a multi-valued categorical field (likely a delimited list of category labels, e.g. from Open Food Facts), but this cannot be confirmed from the evidence.","role":"feature","scope":"column","target":"categories_tags","treatment":"Re-profile with list/string handling enabled, then split on the delimiter and one-hot or multi-hot encode before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `countries_tags` was skipped by the profiler, so no statistics beyond row count and null rate are available. All 77,145 rows are non-null, but uniqueness, distribution, and value examples are unknown. The name suggests a multi-valued tag field (e.g., comma- or colon-separated country codes like `en:france`), but this cannot be confirmed from the evidence.","role":"feature","scope":"column","target":"countries_tags","treatment":"Re-profile with a tag-aware parser (split on separator) before deciding on encoding or filtering."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.url_rate","stats.one_word_rate","stats.word_mean","stats.len_min","stats.len_max","stats.n_duplicates","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Open Food Facts product image URLs, one per row, with url_rate of 1.0 and word_mean of 1.0 confirming each value is a single link. It is near-unique (47,035 distinct out of 77,145) and 39.03% null, so coverage is partial. Lengths are tightly bounded (75-96 chars) reflecting a fixed CDN path template, and only one duplicate URL appears.","role":"metadata","scope":"column","target":"image_url","treatment":"Drop for modelling; retain as a reference link for image fetching or manual inspection."},{"confidence":"high","critiques":[],"evidence_keys":["language_counts","null_rate","stats.n_empty","stats.duplicate_rate","stats.n_duplicates","stats.len_median","stats.len_max","stats.word_median","stats.readability_flesch_mean","top_values","top_words","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text ingredient lists from what looks like a food product database, dominated by English (1623 rows) but spanning 30 languages including French (212), German (128), and trace Thai/Korean/Arabic. 41.91% of values are null and 4981 are empty strings while another 2553 read literally as 'undefined', and 31.04% of non-null entries are exact duplicates \u2014 cheese-style boilerplate like 'Pasteurized milk, cheese culture, salt, enzymes.' recurs hundreds of times. Texts are short on average (word_median 16, len_median 126) but stretch to 5283 characters, and the Flesch mean of 16.0 reflects dense comma-separated lists rather than prose.","role":"free_text","scope":"column","target":"ingredients_text","treatment":"Normalise 'undefined'/empty to null, dedupe, and tokenize per detected language before embedding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column \"labels_tags\" was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 77145 and a null rate of 0.0. The name suggests a multi-valued tag or label field (likely comma- or pipe-delimited strings), but this cannot be confirmed from the evidence. No surprises can be flagged without underlying stats.","role":"other","scope":"column","target":"labels_tags","treatment":"Re-run the profiler with parsing for list-like strings before deciding on encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named nutrition_grades_tags, suggesting it holds Nutri-Score-style grade tags (e.g., a\u2013e) for food products. Saturn skipped profiling, so no uniqueness, value distribution, or stats are available beyond a row count of 77145 with a null_rate of 0.0. Without cardinality or value samples, the actual content cannot be verified from the evidence.","role":"label","scope":"column","target":"nutrition_grades_tags","treatment":"Re-profile to recover value distribution before deciding; if it resolves to a small grade vocabulary, one-hot encode."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column `origins_tags` was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 77145 and a null rate of 0.0. The name suggests a tag-style field listing geographic origins, likely multi-valued (comma- or pipe-delimited) per row, but this cannot be confirmed from the evidence. No distributional signals can be assessed until the column is re-profiled.","role":"metadata","scope":"column","target":"origins_tags","treatment":"Re-run the profiler on this column; if multi-valued, split on the delimiter and one-hot or count-encode the tags."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.duplicate_rate","stats.n_duplicates","stats.n_empty","stats.len_mean","stats.word_median","top_values","top_words","language_counts","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Short product-name strings (mean 27.7 chars, median 4 words) for what looks like a cheese-dominated catalog \u2014 'cheese' appears 13,869 times and the top values are 'Cottage Cheese', 'Cheese', 'Mozzarella', etc. Of 77,145 rows, 30.9% are duplicates (23,564) and case-variant pairs like 'Cottage Cheese'/'cottage cheese' and 'Cream Cheese'/'Cream cheese' inflate that count; 349 rows are empty and null_rate is 1.04%. Although English dominates (3,820 detected), there is a multilingual tail (de 169, fr 315, it 163, es 114) that will fragment exact-match joins.","role":"free_text","scope":"column","target":"product_name","treatment":"Normalize case and whitespace to collapse near-duplicates, then tokenize/embed for modelling or fuzzy matching."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.duplicate_rate","stats.n_empty","stats.vocab_size","stats.word_mean","stats.len_mean","top_values","top_words"],"model":"anthropic:claude-opus-4-7","narrative":"This column captures food portion sizes as free-text quantity strings (e.g. '1 serving(s)', '8 oz', '200 g'), mixing units of grams, ounces and serving counts. It is sparse and repetitive: 57.69% of rows are null, 4252 are empty, and 90.5% of populated values are duplicates drawn from a vocabulary of just 1802 tokens. Note the inconsistent formatting \u2014 '200 g' (1469) and '200g' (696) are stored as separate strings, so naive grouping will undercount.","role":"feature","scope":"column","target":"quantity","treatment":"Parse into numeric magnitude + normalized unit (g/oz/serving), collapsing variants like '200 g' and '200g'."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":3586,"prompt_tokens":13760,"total_tokens":17346}},"language_counts":{"ar":1,"bg":8,"bs":3,"ca":15,"ceb":4,"cs":18,"da":10,"de":297,"el":8,"en":5443,"eo":4,"es":151,"et":6,"fi":20,"fr":527,"hr":5,"hu":6,"id":4,"it":185,"ja":13,"ko":1,"lt":2,"ms":5,"nl":52,"nn":2,"no":22,"pl":49,"pt":33,"ro":6,"ru":26,"sh":2,"sk":3,"sr":2,"sv":31,"th":1,"tr":15,"uk":8,"zh":3},"meta":{"generated_at":"2026-05-01T18:38:27+00:00","mode":"full","row_count":77145,"sampled_rows":77145,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/cache/quirky/openfoodfacts_cheese_20260121.parquet"},"notes":[],"saturn_version":"0.2.0","schema":{"brands_tags":"unknown","categories_tags":"unknown","countries_tags":"unknown","image_url":"text","ingredients_text":"text","labels_tags":"unknown","nutrition_grades_tags":"unknown","origins_tags":"unknown","product_name":"text","quantity":"text"}}
