{"columns":[{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"}],"column":"update_key","extras":{"singletons":5,"top_values":[["brands",28],["sort",10],["divinfood",5],["key_1748337248",2],["nova-yogurts",1],["key_1744830970",1],["ingredients20240805",1],["germany2",1],["france",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":9,"null_rate":0.0,"stats":{"cardinality":9,"entropy":2.0151590049562578,"entropy_ratio":0.6357118872021776,"top_rate":0.56,"top_value":"brands"}},{"alerts":[{"code":"long_tail","level":"info","message":"41 singleton categories"}],"column":"categories_old","extras":{"singletons":41,"top_values":[["Snacks, Snacks sucr\u00e9s, Biscuits et g\u00e2teaux, Biscuits, Biscuits secs",2],["Snacks, Snacks sucr\u00e9s, Biscuits et g\u00e2teaux, Biscuits",2],["Aliments et boissons \u00e0 base de v\u00e9g\u00e9taux, Aliments d'origine v\u00e9g\u00e9tale, Snacks, C\u00e9r\u00e9ales et pommes de terre, Pains, Tartines craquantes extrud\u00e9es, Pains croustillants",2],["Snacks, Sweet snacks, Cocoa and its products, Chocolates, Dark chocolates",2],["Dairies, Fermented foods, Fermented milk products, Cheeses, Cream cheeses, fr:Fromages-frais-sucres, en:yogurts",1],["Snacks, Snacks sucr\u00e9s, Cacao et d\u00e9riv\u00e9s",1],["Przek\u0105ski, S\u0142odkie przek\u0105ski, Kakao i produkty na bazie kakao, Czekolada, Czekolada deserowa, Czekolada gorzka",1],["\u0417\u0430\u043a\u0443\u0441\u043a\u0438, \u0421\u043b\u0430\u0434\u043a\u0438 \u0437\u0430\u043a\u0443\u0441\u043a\u0438, \u041a\u0430\u043a\u0430\u043e\u0432\u0438 \u0438\u0437\u0434\u0435\u043b\u0438\u044f, \u0428\u043e\u043a\u043e\u043b\u0430\u0434\u0438, \u0422\u044a\u043c\u0435\u043d \u0448\u043e\u043a\u043e\u043b\u0430\u0434",1],["Boissons et pr\u00e9parations de boissons, Boissons, Eaux, Eaux de sources, Boissons sans sucre ajout\u00e9",1],["Snacks, Snacks sucr\u00e9s, Confiseries, Succ\u00e9dan\u00e9s du chocolat, en:Vegecaos",1],["Snacks, Sweet snacks, Cocoa and 
its products, Confectioneries, Chocolates, Dark chocolates",1],["Snacks, Snacks sucr\u00e9s, Biscuits et g\u00e2teaux, Biscuits, en:Biscuits et g\u00e2teaux, en:Snacks sucr\u00e9s",1],["Snacks, Snacks sucr\u00e9s, Biscuits et g\u00e2teaux, Biscuits, Biscuits sabl\u00e9s, Sabl\u00e9s \u00e0 la noix de coco",1],["Botanas,Snacks dulces,Galletas y pasteles,Galletas,Galletas rellenas",1],["Produits laitiers, Produits ferment\u00e9s, Produits laitiers ferment\u00e9s, Snacks, Fromages, Snacks sucr\u00e9s, Cacao et d\u00e9riv\u00e9s, Chocolats, Chocolats noirs, Chocolats noirs en tablette, Chocolat noir en tablette extra d\u00e9gustation \u00e0 70% de cacao minimum",1],["Aliments et boissons \u00e0 base de v\u00e9g\u00e9taux, Aliments d'origine v\u00e9g\u00e9tale, Snacks, C\u00e9r\u00e9ales et pommes de terre, Snacks sal\u00e9s, Amuse-gueules, Chips et frites, Chips, Chips de pommes de terre, Chips de pommes de terre \u00e0 l'huile de tournesol, en:Aliments d'origine v\u00e9g\u00e9tale, en:Aliments et boissons \u00e0 base de v\u00e9g\u00e9taux, en:Amuse-gueules, en:Chips, en:Chips de pommes de terre, en:Chips de pommes de terre classiques, en:Chips de pommes de terre \u00e0 l'huile de tournesol, en:Chips et frites, en:C\u00e9r\u00e9ales et pommes de terre, en:Snacks sal\u00e9s",1],["Snacks, Snacks sucr\u00e9s, Cacao et d\u00e9riv\u00e9s, Chocolats, Chocolats noirs, Chocolats noirs en tablette",1],["Snacks,Sweet snacks,Biscuits and cakes,Biscuits,Chocolate biscuits,Filled biscuits,Dark chocolate biscuits",1],["Snacks, Sweet snacks, Cocoa and its products, Chocolates, Dark chocolates, Cacao-et-derives, Chocolats, Chocolats-noirs, Chocolats-noirs-extra-fin",1],["Aliments et boissons \u00e0 base de v\u00e9g\u00e9taux,Aliments d'origine v\u00e9g\u00e9tale,C\u00e9r\u00e9ales et pommes de terre,Pains,Pains 
croustillants",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":45,"null_rate":0.02,"stats":{"cardinality":45,"entropy":5.45144453799276,"entropy_ratio":0.9926420904514142,"top_rate":0.04081632653061224,"top_value":"Snacks, Snacks sucr\u00e9s, Biscuits et g\u00e2teaux, Biscuits, Biscuits secs"}},{"alerts":[],"column":"ecoscore_score","extras":{"histogram":{"counts":[10,4,12,8,6,3],"edges":[13.0,26.5,40.0,53.5,67.0,80.5,94.0]},"sample":[72.0,44.0,26.0,20.0,57.0,40.0,52.0,40.0,47.0,58.0,41.0,29.0,85.0,55.0,26.0,70.0,40.0,90.0,64.0,40.0,64.0,26.0,28.0,94.0,70.0,13.0,21.0,60.0,21.0,43.0,53.0,76.0,25.0,77.0,27.0,50.0,38.0,26.0,57.0,69.0,15.0,40.0,64.0]},"kind":"numeric","n":50,"n_null":7,"n_unique":31,"null_rate":0.14,"stats":{"iqr":36.5,"kurtosis":-0.794581810915528,"max":94.0,"mean":47.74418604651163,"median":44.0,"min":13.0,"n_outliers":0,"outlier_rate":0.0,"q1":27.5,"q3":64.0,"skew":0.3068531918571063,"std":21.189724624894215,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"56.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"environment_impact_level","extras":{"singletons":0,"top_values":[["",22]]},"kind":"categorical","n":50,"n_null":28,"n_unique":1,"null_rate":0.56,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"ingredients_text_fi","extras":{"singletons":3,"top_values":[["",2],["kaakaomassa, kaakaovoi, v\u00e4h\u00e4rasvainen kaakaojauhe, sokeri, vanilja. Saattaa sis\u00e4lt\u00e4\u00e4 hasselp\u00e4hkin\u00e4\u00e4, muita p\u00e4hkin\u00f6it\u00e4, maitoa, soijaa. Tummassa suklaassa kaakaota v\u00e4hint\u00e4\u00e4n 90%.",1],["kaakaomassa, v\u00e4h\u00e4rasvainen kaakaojauhe, kaakaovoi, sokeri, emulgointiaine (_soijalesitiini_), vaniljauute. Suklaassa kaakaota v\u00e4hint\u00e4\u00e4n 85 %. 
Saattaa sis\u00e4lt\u00e4\u00e4 pieni\u00e4 m\u00e4\u00e4ri\u00e4 p\u00e4hkin\u00e4\u00e4 ja maitoa.",1],["_VEHN\u00c4JAUHO_, palmu\u00f6ljy, t\u00e4rkkelyssiirappi, _OHRAMALLASUUTE_, nostatusaineet ammoniumkarbonaatit, natriumkarbonaatit), suola, _KANANMUNAT_, aromi, jauhonparanne (_NATRIUMDISULFIITTI_).",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":4,"null_rate":0.9,"stats":{"cardinality":4,"entropy":1.9219280948873623,"entropy_ratio":0.9609640474436811,"top_rate":0.4,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"nutrition_data_prepared","extras":{"singletons":0,"top_values":[["",48]]},"kind":"categorical","n":50,"n_null":2,"n_unique":1,"null_rate":0.04,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"packaging_shapes_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutrient_levels_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"packagings_materials","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_without_ecobalyse_ids","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"76.0% null"}],"column":"generic_name_nl","extras":{"singletons":3,"top_values":[["",9],["Extra fijne pure chocolade",1],["Biscuits bedekt met melkchocolade",1],["Krokante 
volkorentoasts",1]]},"kind":"categorical","n":50,"n_null":38,"n_unique":4,"null_rate":0.76,"stats":{"cardinality":4,"entropy":1.207518749639422,"entropy_ratio":0.603759374819711,"top_rate":0.75,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"misc_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"product_name_sv","extras":{"singletons":4,"top_values":[["90% Cocoa",1],["Arriba 85% Cacao Dark Chocolate",1],["Dark 70%",1],["Original",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":4,"null_rate":0.92,"stats":{"cardinality":4,"entropy":2.0,"entropy_ratio":1.0,"top_rate":0.25,"top_value":"90% Cocoa"}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+3.90"},{"code":"outliers","level":"warn","message":"8.0% rows beyond 1.5 IQR"}],"column":"scans_n","extras":{"histogram":{"counts":[39,7,3,0,0,0,1],"edges":[333.0,645.8571428571429,958.7142857142857,1271.5714285714284,1584.4285714285713,1897.2857142857142,2210.142857142857,2523.0]},"sample":[2523.0,1091.0,1114.0,1110.0,921.0,775.0,764.0,771.0,717.0,638.0,726.0,692.0,606.0,576.0,598.0,574.0,558.0,547.0,540.0,524.0,505.0,517.0,529.0,479.0,596.0,478.0,447.0,438.0,506.0,411.0,408.0,443.0,404.0,391.0,386.0,381.0,400.0,390.0,383.0,376.0,405.0,367.0,384.0,381.0,357.0,354.0,358.0,379.0,346.0,333.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":49,"null_rate":0.0,"stats":{"iqr":217.0,"kurtosis":18.723151379432267,"max":2523.0,"mean":577.94,"median":492.0,"min":333.0,"n_outliers":4,"outlier_rate":0.08,"q1":387.0,"q3":604.0,"skew":3.899183874756958,"std":343.9457367026351,"zero_rate":0.0}},{"alerts":[{"code":"constant","level":"info","message":"only one distinct 
value"}],"column":"schema_version","extras":{"histogram":{"counts":[0,0,0,50,0,0,0],"edges":[995.5,995.6428571428571,995.7857142857143,995.9285714285714,996.0714285714286,996.2142857142857,996.3571428571429,996.5]},"sample":[996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0,996.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":0.0,"max":996.0,"mean":996.0,"median":996.0,"min":996.0,"n_outliers":0,"outlier_rate":0.0,"q1":996.0,"q3":996.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"url","extras":{"singletons":50,"top_values":[["https://world.openfoodfacts.org/product/6111242100992/perly",1],["https://world.openfoodfacts.org/product/7622210449283/prince-gout-chocolat-lu",1],["https://world.openfoodfacts.org/product/3046920029759/edelbitter-schokolade-lindt",1],["https://world.openfoodfacts.org/product/6111031005064/tonik-%D8%B9%D8%B1%D8%A8%D9%8A",1],["https://world.openfoodfacts.org/product/3175680011480/gerble-sesame-cookie-230g-8-2oz",1],["https://world.openfoodfacts.org/product/20995553/chocolat-noir-85-cacao-j-d-gross",1],["https://world.openfoodfacts.org/product/3268840001008/hhhhh-cristaline",1],["https://world.openfoodfacts.org/product/3362600011044/henry-s",1],["https://world.openfoodfacts.org/product/8425197712024/compound-chocolate-with-milk-and-almonds-maruja",1],["https://world.openfoodfacts.org/product/7622210578464/organic-70-dark-chocolate-bar-green-black-s",1],["https://world.openfoodfacts.org/product/6111259343108/king-cookies-excelo",1],["https://world.openfoodfacts.org/product/3362600011228/sable-coco-henry-s-42g",1],["https://world.openfoodfacts.org/product/8000500310427/bisc
uits-nutella",1],["https://world.openfoodfacts.org/product/7300400481595/authentique-wasa",1],["https://world.openfoodfacts.org/product/3046920022651/excellence-noir-intense-70-cacao-lindt",1],["https://world.openfoodfacts.org/product/5060042641000/tyrell-s-lightly-sea-salted-tyrrell-s",1],["https://world.openfoodfacts.org/product/7622210584724/intense-dark-chocolate-green-and-black",1],["https://world.openfoodfacts.org/product/3046920022606/excellence-85-cacao-chocolat-noir-puissant-lindt-lindt",1],["https://world.openfoodfacts.org/product/3229820100234/filled-dark-chocolate-bjorg",1],["https://world.openfoodfacts.org/product/20022464/extra-dark-74-cocoa-fin-carre",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://world.openfoodfacts.org/product/6111242100992/perly"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"vitamins_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"debug_param_sorted_langs","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"40 singleton categories"}],"column":"packaging","extras":{"singletons":40,"top_values":[["Plastique",4],["Packet,Hdpe film-packet,Etui en carton,Film en plastique",1],["en:Aluminium wrap,en:Box cardboard,en:Caja de cart\u00f3n,en:Card-box,en:Foil-wrapper,es:Recipiente,pt:Papel de aluminio,\u00c9tui carton,Feuille aluminium",1],["Cardboard,Plastic",1],["Cardboard,Non-corrugated cardboard",1],["Plastique,Bouteille ou Flacon,PET 1 - Polyt\u00e9r\u00e9phtalate d'\u00e9thyl\u00e8ne,Bouteille,Bouchon en plastique",1],["M\u00e9tal,Papier,en:Recyclable 
Metals,Aluminium",1],["Paper/Foil",1],["Plastique,O 7 - Autres plastiques",1],["Papier,Enveloppe,en:Package paper,en:Paper recycling",1],["M\u00e9tal,Carton,M\u00e9taux recyclables,Aluminium",1],["en:MixedPlasticFilm-packet,en:mixed plastic film-packet",1],["1 film to recycle, 1 paper wrap to recycle, en:paper-wrapper, en:foil-wrapper",1],["fr:emballage carton,fr:papier aluminium",1],["\u00c9tui,Carton,Plastique,Sec,Film",1],["Plastikowe,Mixed plastic-packet,Sachet plastique de 3g,",1],["Carta,Busta",1],["Papier",1],["",1],["Pl\u00e1stico",1]]},"kind":"categorical","n":50,"n_null":6,"n_unique":41,"null_rate":0.12,"stats":{"cardinality":41,"entropy":5.277613436819116,"entropy_ratio":0.9850792735693349,"top_rate":0.09090909090909091,"top_value":"Plastique"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"grades","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"outliers","level":"warn","message":"12.0% rows beyond 1.5 
IQR"}],"column":"last_modified_t","extras":{"histogram":{"counts":[3,1,1,2,3,8,32],"edges":[1737907641.0,1742298509.4285715,1746689377.857143,1751080246.2857144,1755471114.7142856,1759861983.142857,1764252851.5714285,1768643720.0]},"sample":[1768557199.0,1762997306.0,1768540604.0,1768504085.0,1757883911.0,1767814111.0,1761570954.0,1768001556.0,1745147085.0,1751977023.0,1767353907.0,1738845211.0,1768042908.0,1767757809.0,1759572852.0,1767705743.0,1760267634.0,1766162622.0,1761393049.0,1762240662.0,1768643720.0,1738845015.0,1764601816.0,1767819312.0,1768137111.0,1767437745.0,1768380967.0,1764429510.0,1748385396.0,1767521360.0,1767603669.0,1764175241.0,1768556517.0,1759747781.0,1767601341.0,1762163269.0,1764945307.0,1767183580.0,1767096588.0,1767515080.0,1764511895.0,1767722174.0,1766330181.0,1761737635.0,1767728546.0,1766831716.0,1768494060.0,1737907641.0,1765376778.0,1755204544.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"iqr":6137869.0,"kurtosis":2.9715855401992988,"max":1768643720.0,"mean":1762859434.52,"median":1766580948.5,"min":1737907641.0,"n_outliers":6,"outlier_rate":0.12,"q1":1761612624.25,"q3":1767750493.25,"skew":-1.9610565054403708,"std":8093374.42102295,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"76.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_nl","extras":{"singletons":0,"top_values":[["",12]]},"kind":"categorical","n":50,"n_null":38,"n_unique":1,"null_rate":0.76,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[],"column":"allergens_lc","extras":{"singletons":3,"top_values":[["en",22],["fr",21],["es",2],["de",1],["it",1],["pl",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":6,"null_rate":0.04,"stats":{"cardinality":6,"entropy":1.5777508030466874,"entropy_ratio":0.6103573272751633,"top_rate":0.4583333333333333,"top_value":"en"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"states_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_ja","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"teams_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"29 singleton categories"}],"column":"traces_from_user","extras":{"singletons":29,"top_values":[["(en) ",7],["(fr) ",4],["(fr) en:milk,en:nuts",4],["(en) en:milk,en:nuts",2],["(en) en:milk,en:nuts,en:sesame-seeds,en:soybeans",2],["(en) en:nuts",2],["(en) Eggs",1],["(fr) en:milk,en:nuts,en:soybeans",1],["(fr) en:eggs,en:lupin,en:milk,en:mustard,en:nuts,en:soybeans",1],["(fr) en:milk,en:soybeans",1],["(fr) Lait,Fruits \u00e0 coque",1],["(fr) Soja",1],["(es) en:mustard",1],["(fr) 
en:lupin,en:milk,en:mustard,en:sesame-seeds,en:soybeans",1],["(fr) en:milk,en:nuts,en:sesame-seeds,en:soybeans",1],["(en) en:milk",1],["(fr) Lait,Fruits \u00e0 coque,Graines de s\u00e9same,Soja",1],["(en) en:eggs,en:mustard,en:nuts,en:sesame-seeds,en:soybeans",1],["(en) en:gluten,en:Amande,en:Arachides,en:Avoine,en:Bl\u00e9,en:Lait,en:Noisettes,en:Noix,en:Noix de cajou,en:Noix de macadamia,en:Noix de p\u00e9can,en:Noix du br\u00e9sil,en:Orge,en:Pistaches,en:Seigle",1],["(fr) en:lupin,en:milk,en:mustard,en:soybeans",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":35,"null_rate":0.0,"stats":{"cardinality":35,"entropy":4.8108265006866615,"entropy_ratio":0.9379140290745782,"top_rate":0.14,"top_value":"(en) "}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"origins_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.8% of rows"}],"column":"serving_quantity_unit","extras":{"singletons":1,"top_values":[["g",45],["ml",1]]},"kind":"categorical","n":50,"n_null":4,"n_unique":2,"null_rate":0.08,"stats":{"cardinality":2,"entropy":0.15109697051711368,"entropy_ratio":0.15109697051711368,"top_rate":0.9782608695652174,"top_value":"g"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"vitamins_prev_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+3.91"},{"code":"outliers","level":"warn","message":"8.0% rows beyond 1.5 
IQR"}],"column":"unique_scans_n","extras":{"histogram":{"counts":[39,7,3,0,0,0,1],"edges":[319.0,595.8571428571429,872.7142857142857,1149.5714285714284,1426.4285714285713,1703.2857142857142,1980.1428571428569,2257.0]},"sample":[2257.0,1050.0,1045.0,888.0,829.0,726.0,723.0,666.0,640.0,612.0,611.0,590.0,562.0,557.0,552.0,536.0,527.0,516.0,502.0,495.0,473.0,467.0,458.0,449.0,435.0,429.0,421.0,413.0,395.0,390.0,387.0,381.0,381.0,377.0,369.0,366.0,365.0,362.0,360.0,356.0,349.0,348.0,344.0,343.0,334.0,334.0,331.0,326.0,323.0,319.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":48,"null_rate":0.0,"stats":{"iqr":198.0,"kurtosis":18.710636942247405,"max":2257.0,"mean":525.38,"median":432.0,"min":319.0,"n_outliers":4,"outlier_rate":0.08,"q1":362.75,"q3":560.75,"skew":3.910706375689542,"std":306.40908296336283,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"41 singleton categories"}],"column":"labels","extras":{"singletons":41,"top_values":[["",8],["Distributor labels,Charte LU Harmony,Triman",1],["Point Vert,Triman",1],["No preservatives, Made in France, Natural flavors, No colorings, No palm oil, Nutriscore, Nutriscore Grade B, Triman, en:green-dot",1],["Vegetarian,Fair trade,Fairtrade International,No artificial flavors,Vegan,Fairtrade cocoa,FSC,FSC Mix,Max Havelaar",1],["Triman,Sans Nitrates",1],["Green Dot,Made in Spain,Ce",1],["Commerce \u00e9quitable,Bio,V\u00e9g\u00e9tarien,Bio europ\u00e9en,Fairtrade International,V\u00e9g\u00e9talien,PL-EKO-07,en:Soil Association Organic,The Vegan Society,en:Commerce \u00e9quitable",1],["Green Dot",1],["Vegetariano,fr:Ponto Verde",1],["V\u00e9g\u00e9tarien,Point Vert,Triman",1],["Sans conservateurs,Fabriqu\u00e9 en France,Triman,Lindt & Spr\u00fcngli Cacao Farming Program",1],["No gluten,Vegetarian,No artificial flavors,Vegan,Assured Food Standards,Green Dot,No artificial colors,No flavour enhancer,No MSG,Triman,Made-in-england,Terracycle",1],["Commerce \u00e9quitable,Bio,V\u00e9g\u00e9tarien,Bio 
europ\u00e9en,Fairtrade International,Agriculture non UE,V\u00e9g\u00e9talien,FR-BIO-01,en:FSC,FSC Mix,Point Vert,Max Havelaar,PL-EKO-07,en:Soil Association Organic,The Vegan Society",1],["Agriculture non UE,Fabriqu\u00e9 en Belgique,Fabriqu\u00e9 en France,Sans huile de palme,Triman",1],["Organic,EU Organic,Non-EU Agriculture,Certified B Corporation,EU Agriculture,EU/non-EU Agriculture,FR-BIO-01,No palm oil,Pure cocoa butter,AB Agriculture Biologique,fr:Farine de bl\u00e9 fran\u00e7ais",1],["Vegetarian,Fair trade,Fairtrade International,Vegan,Fairtrade cocoa,Pure cocoa butter,Rainforest Alliance,Rainforest Alliance Cocoa,Commerce-equitable",1],["V\u00e9g\u00e9tarien,Source de fibres alimentaires,Point Vert,Riche en fibres,Triman,Emballage-recyclable",1],["Halal",1],["en:Unknown",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":42,"null_rate":0.02,"stats":{"cardinality":42,"entropy":5.124913925747862,"entropy_ratio":0.9504102826177653,"top_rate":0.16326530612244897,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"}],"column":"generic_name_en","extras":{"singletons":7,"top_values":[["",36],["Extra fine dark chocolate 90% cocoa",1],["Dark chocolate",1],["Compound Chocolate with MILK AND ALMONDS",1],["Lightly sea salted potato chips",1],["Crackers",1],["Dark Chocolate 70% cocoa",1],["Chocolate bar with milk and hazelnuts",1]]},"kind":"categorical","n":50,"n_null":7,"n_unique":8,"null_rate":0.14,"stats":{"cardinality":8,"entropy":1.0979554511689993,"entropy_ratio":0.36598515038966645,"top_rate":0.8372093023255814,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"weighters_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"popularity_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"product_name_fi","extras":{"singletons":3,"top_values":[["",2],["Excellence: 90% cocoa Dark Supreme",1],["Arriba 85% Cacao Dark Chocolate",1],["Original",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":4,"null_rate":0.9,"stats":{"cardinality":4,"entropy":1.9219280948873623,"entropy_ratio":0.9609640474436811,"top_rate":0.4,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"6 singleton categories"}],"column":"origin_fr","extras":{"singletons":6,"top_values":[["",40],["Fabriqu\u00e9 par: Aachen Allemagne",1],["Germe de bl\u00e9 origine ue. S\u00e9same origine non-ue.",1],["France",1],["fabriqu\u00e9 en France.pommes origine UE. noisettes origine UE et non UE",1],["Fabriqu\u00e9 en France par Nutrition et Sant\u00e9. Farine de bl\u00e9: France. 
Figues : non UE",1],["P\u00e2te de cacao (Afrique de l'Ouest, Am\u00e9rique du Sud)Afrique, Europe, Madagascar, Am\u00e9rique du Sud, Afrique de l'Ouest",1]]},"kind":"categorical","n":50,"n_null":4,"n_unique":7,"null_rate":0.08,"stats":{"cardinality":7,"entropy":0.8957983952853935,"entropy_ratio":0.3190898266004902,"top_rate":0.8695652173913043,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"27 singleton categories"}],"column":"generic_name","extras":{"singletons":27,"top_values":[["",21],["BISCUITS FOURR\u00c9S (35%) PARFUM CHOCOLAT",1],["Chocolat noir extra-fin traditionnel \u00e0 90% de cacao",1],["Biscuits au s\u00e9same",1],["Eau de source",1],["Compound Chocolate with MILK AND ALMONDS",1],["Sabl\u00e9 coco",1],["Biscuit fourr\u00e9 \u00e0 la p\u00e2te \u00e0 tartiner aux noisettes et au cacao Nutella\u00ae",1],["Pain croustillant a la farine de seigle",1],["Chocolat noir extra-fin traditionnel",1],["Chips de pommes de terre l\u00e9g\u00e8rement sal\u00e9es au sel de mer",1],["Chocolat noir extra fin, traditionnel",1],["go\u00fbters fourr\u00e9s au chocolat noir",1],["Pain croustillant \u00e0 la farine compl\u00e8te de seigle, avoine et s\u00e9same.",1],["Crackers",1],["Dark Chocolate 70% cocoa",1],["Biscuits aux pommes et aux noisettes, tr\u00e8s pauvres en sel, riches en vitamines B1, B2, B9 et E et source de vitamines PP et B6",1],["Nuss-Nugat-Creme",1],["Snack Sal\u00e9",1],["Biscuits au son de bl\u00e9 et la figue, riches en fibres, magnesium et phosphore, source de fer, et tres pauvres en sodium.",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":28,"null_rate":0.04,"stats":{"cardinality":28,"entropy":3.663323628255448,"entropy_ratio":0.762024790690408,"top_rate":0.4375,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"nutriscore_version","extras":{"singletons":0,"top_values":[["2023",50]]},"kind":"categorical","n":50,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"2023"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_without_ciqual_codes","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"manufacturing_places_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"photographers_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_pl","extras":{"singletons":0,"top_values":[["",5]]},"kind":"categorical","n":50,"n_null":45,"n_unique":1,"null_rate":0.9,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"informers_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"35 singleton categories"}],"column":"ingredients_text_en","extras":{"singletons":35,"top_values":[["",9],["milk cream, cream, sugar, banana, bacteria",1],["WHEAT flour 35%, whole WHEAT flour 15.7%, sugar, vegetable oils (palm, rapeseed), low-fat cocoa powder 4.5%, glucose syrup, WHEAT starch, raising agents (ammonium bicarbonate, sodium bicarbonate, disodium diphosphate), emulsifiers (SOY lecithin, sunflower lecithin), salt, skimmed MILK powder, 
lactose and MILK proteins, flavors, MAY CONTAIN EGG.",1],["cocoa mass, cocoa butter, fat reduced cocoa, sugar, vanilla",1],["Wheat flour, brown cane sugar, rapeseed oil, toasted sesame 10.6%, wheat germ 5.4%, whole wheat flour 5.4%, natural flavor, magnesium, emulsifier: lecithins, raising agents (potassium tartrates, sodium carbonates, ammonium carbonates), sea salt, wheat starch, vitamins (E, PP, B6, B1, B9).",1],["cocoa mass, low-fat cocoa powder, cocoa butter, sugar, emulsifier: lecithin (soy), vanilla extract, may contain traces of nuts and milk,",1],["Hhhhh",1],["sugar, cocoa butter, whole milk powder, cocoa mass, almonds, emulsifier (soya lecithin), flavoring",1],["cocoa mass #, cane sugar #, cocoa butter #, vanilla extract #, may contain nuts, milk,",1],["wholemeal rye flour (77 g*), rye flour (28 g*), yeast, salt, may contain traces of milk and sesame seeds, *in g per 100 g of product,",1],["cocoa paste, sugar, cocoa butter, vanilla,",1],["Potatoes, sunflower oil, sea salt. May contain Milk.",1],["cocoa mass, cocoa butter, fat-reduced cocoa powder, cane sugar, vanilla extract",1],["P\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille bourbon naturelle en gousse.",1],["_Wheat_ flour 39%, dark chocolate 25% (cocoa mass, cane sugar, cocoa butter), unrefined brown cane sugar, wholemeal _wheat_ flour 15%, oleic sunflower oil, natural vanilla flavouring, skimmed _milk_ powder, sea salt, raising agents: ammonium carbonates, sodium carbonates, thickener: acacia gum, antioxidant: rosemary extract.",1],["cocoa mass, sugar, cocoa butter, fat reduced cocoa powder, emulsifier: lecithins (soya), natural vanilla flavouring, dark chocolate contains: cocoa solids 74% minimum,",1],["whole rye flour (57 g), wheat bran (27 g), oatmeal (13 g), sesame seeds (7.9 g), wheat germ, salt.",1],["wheat  flour, palm oil, glucose syrup,  barley  malt extract, raising agents (ammonium carbonates, sodium carbonates), salt,  eggs , flavouring, flour treatment agent (sodium 
 metabisulfite ),",1],["cocoa mass, sugar, cocoa butter, vanilla,",1],["Farine de ma\u00efs* (70%), farine de riz*, sel marin. * K issus de l'agriculture biologique. \u2022 sans sucres ajout\u00e9s(\u00b9) (contient des sucres naturellement pr\u00e9sents.",1]]},"kind":"categorical","n":50,"n_null":6,"n_unique":36,"null_rate":0.12,"stats":{"cardinality":36,"entropy":4.811037868342278,"entropy_ratio":0.9305817525399476,"top_rate":0.20454545454545456,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"11 singleton categories"},{"code":"null_rate","level":"warn","message":"68.0% null"}],"column":"ingredients_text_it","extras":{"singletons":11,"top_values":[["",5],["Pasta di cacao, burro di cacao, cacao magro in polvere, zucchero. Pu\u00f2 contenere nocciole, mandorle, altra frutta a guscio, latte, soia.",1],["crema alle NOCCIOLE e al cacao 40% (zucchero, olio di palma, NOCCIOLE 13%, LATTE Scremato in polvere 8.7%, cacao magro 7,4%, emulsionanti: lecitine (SOIA): vanillina), farina di FRUMENTO (32%), grassi vegetali (palma, palmisto), zucchero di canna (9%), LATTOSIO, crusca di FRUMENTO, LATTE intero in polvere, estratto in polvere di malto d'ORZO e mais, miele, agenti lievitanti (difosfato disodico. carbonato acido di ammonio, carbonato acido di sodio), cacao magro, sale, amido di FRUMENTO, farina di ORZO maltato, emulsionanti: lecitine (SOIA), vanillina.",1],["pasta di cacao, zucchero, burro di cacao, vaniglia",1],["patate, olio di girasole, sale marino.",1],["Pasta di cacao, cacao magro, burro di cacao, zucchero grezzo di canna, vaniglia.",1],["Farina integrale di _segale_ (59 g), crusca di _grano_ (27 g), fiocchi d'_avena_ (12 g), semi di _sesamo_ (7,0 g), germe di _grano_, sale. 
Pu\u00f2 contenere tracce di _latte_.",1],["Farina di _FRUMENTO_, olio di palma, sciroppo di glucosio, estratto di malto d'_ORZO_, agenti lievitanti (carbonati di ammonio, carbonati di sodio), sale, _UOVA_, aroma, agente di trattamento della farina (_METABISOLFITO_ di sodio).",1],["Pasta di cacao, zucchero, burro di cacao, vaniglia.",1],["Massa di cacao, zucchero, burro di cacao, emulsionante: lecitine (soia); estratto di vaniglia. Pu\u00f2 contenere tracce di frutta a guscio e latte. Il 40% della massa di cacao proviene da piantagioni selezionate dell'Ecuador.",1],["wdrated potatoes, sunflower oll, wheat flour, corn lour.test NRC b ber otin. Emulgator (E471), Salz, Farbstoff (Annatto Norbirin, k hottom (BB). Packaged in a protective atmosphere, (DE) KNAEF Kam ef s1sel colorant (n0rbixine de rocou). Peut contenir lait, soja. \u00c0 conse gie vepackt. (FR) SNACK SALE. INGREDIENTS: Pommes de terre disht SNCK SALATO. : Patate disidratate, olio di girasole, (arina d frmu botisiha d annatto). Puo contenere latte, sola. Da consumarsi prelerbilmetp SEL NGREDIENTES: Batatas desidratadas, \u00f3leo de girasol, farinha de trigo.(aimha d mh e o, Pode conter leite, soja. Consumir de prefer\u00ebncia antes de: ver fundo (BB), Enbazhyer OHTS Pttas deshidratadas, aceite de qirasol, harina de trigo, harina de maiz, haia ca rm e eche, soja. 
Consumir preferentemente antes del: ver parte interior (8B), Enast et 'Releenc itle dn 100 g | RI&quot; /30g| Eectsge/Ayt acuilo medo 84U bole / Prodoth te /30g ji begja /Valor energetico Tpas (Grassi/ Unjdos / Grasas tan e\u1eadticte Fets\u00e4uren / dont 2214 kJ 664 kJ 530 kcal 159 kcal adulo medio / 8% 31g 3.0 9 9.3 0.9g 17g 13% Produoad by: see yd Aii dd cassi satui / dos quais Producido por urdes thtrde | Glucites | 5% oidrati / MedaCoyK Sabd 55g 7% Uont sucres /di eui *FRSCAME QNg",1],["25% noci, 25% mandorle, 25% uva sultanina (99,5% uva sultanina, olio di semi di girasole), 25% mirtilli rossi americani, essiccati e zuccherati (60% mirtilli rossi americani, 39% zucchero, olio di semi di girasole). Pu\u00f2 contenere tracce di altra frutta a guscio e arachidi. Confezionato in atmosfera protettiva.",1]]},"kind":"categorical","n":50,"n_null":34,"n_unique":12,"null_rate":0.68,"stats":{"cardinality":12,"entropy":3.274397470347699,"entropy_ratio":0.9133700756113953,"top_rate":0.3125,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"60.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_de","extras":{"singletons":0,"top_values":[["",20]]},"kind":"categorical","n":50,"n_null":30,"n_unique":1,"null_rate":0.6,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-2.06"}],"column":"nova_group","extras":{"histogram":{"counts":[1,0,0,0,14,33],"edges":[1.0,1.5,2.0,2.5,3.0,3.5,4.0]},"sample":[3.0,4.0,3.0,3.0,4.0,4.0,1.0,4.0,4.0,3.0,4.0,4.0,3.0,3.0,3.0,3.0,3.0,4.0,4.0,3.0,4.0,4.0,4.0,3.0,4.0,3.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,3.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,3.0,4.0,4.0,4.0,4.0,4.0,4.0]},"kind":"numeric","n":50,"n_null":2,"n_unique":3,"null_rate":0.04,"stats":{"iqr":1.0,"kurtosis":5.651377168881027,"max":4.0,"mean":3.6458333333333335,"median":4.0,"min":1.0,"n_outliers":1,"outlier_rate":0.020833333333333332,"q1":3.0,"q3":4.0,"skew":-2.0624248677777532,"std":0.6010481388776002,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_fi","extras":{"singletons":0,"top_values":[["",5]]},"kind":"categorical","n":50,"n_null":45,"n_unique":1,"null_rate":0.9,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"16 singleton categories"}],"column":"states","extras":{"singletons":16,"top_values":[["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",8],["en:to-be-checked, en:complete, 
en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",6],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",5],["en:to-be-checked, en:complete, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",3],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-to-be-completed, en:quantity-to-be-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",2],["en:checked, en:complete, en:nutrition-facts-completed, 
en:ingredients-completed, en:expiration-date-completed, en:packaging-code-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",2],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",2],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-to-be-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",2],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",2],["en:to-be-checked, en:complete, en:nutrition-facts-completed, en:ingredients-completed, 
en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",2],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-to-be-selected, en:ingredients-photo-selected, en:front-photo-to-be-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-to-be-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-to-be-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:checked, en:complete, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, 
en:packaging-code-to-be-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-to-be-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, 
en:packaging-code-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-to-be-validated, en:packaging-photo-to-be-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1],["en:checked, en:complete, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-to-be-completed, en:packaging-code-to-be-completed, en:characteristics-completed, en:origins-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, en:photos-uploaded",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":26,"null_rate":0.0,"stats":{"cardinality":26,"entropy":4.286370130156181,"entropy_ratio":0.9119083292597431,"top_rate":0.16,"top_value":"en:to-be-completed, en:nutrition-facts-completed, en:ingredients-completed, en:expiration-date-completed, en:packaging-code-to-be-completed, en:characteristics-to-be-completed, en:origins-to-be-completed, en:categories-completed, en:brands-completed, en:packaging-completed, en:quantity-completed, en:product-name-completed, en:photos-validated, en:packaging-photo-selected, en:nutrition-photo-selected, en:ingredients-photo-selected, en:front-photo-selected, 
en:photos-uploaded"}},{"alerts":[],"column":"ingredients_with_unspecified_percent_sum","extras":{"histogram":{"counts":[2,4,4,3,2,1,34],"edges":[0.400000000000006,14.628571428571433,28.85714285714286,43.08571428571429,57.31428571428572,71.54285714285714,85.77142857142857,100.0]},"sample":[100.0,45.5,100.0,58.4,21.6,100.0,100.0,100.0,100.0,100.0,100.0,100.0,80.0,100.0,100.0,100.0,100.0,100.0,43.0,100.0,93.0,100.0,96.6,100.0,100.0,100.0,0.400000000000006,23.625,100.0,100.0,70.9,100.0,37.0,22.4,100.0,96.875,89.0,35.0,100.0,100.0,100.0,97.0,100.0,50.0,30.0,27.0,100.0,100.0,52.0,1.5]},"kind":"numeric","n":50,"n_null":0,"n_unique":22,"null_rate":0.0,"stats":{"iqr":46.4,"kurtosis":-0.13296797482234624,"max":100.0,"mean":79.416,"median":100.0,"min":0.400000000000006,"n_outliers":0,"outlier_rate":0.0,"q1":53.6,"q3":100.0,"skew":-1.1831449512529044,"std":31.643022718044712,"zero_rate":0.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"added_countries_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"id","extras":{"singletons":50,"top_values":[["6111242100992",1],["7622210449283",1],["3046920029759",1],["6111031005064",1],["3175680011480",1],["20995553",1],["3268840001008",1],["3362600011044",1],["8425197712024",1],["7622210578464",1],["6111259343108",1],["3362600011228",1],["8000500310427",1],["7300400481595",1],["3046920022651",1],["5060042641000",1],["7622210584724",1],["3046920022606",1],["3229820100234",1],["20022464",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"6111242100992"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"nutrient_levels","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-2.78"},{"code":"outliers","level":"warn","message":"9.1% rows beyond 1.5 IQR"}],"column":"sortkey","extras":{"histogram":{"counts":[1,1,1,1,5,35],"edges":[1567543172.0,1574768917.3333333,1581994662.6666667,1589220408.0,1596446153.3333333,1603671898.6666667,1610897644.0]},"sample":[1604164775.0,1610831524.0,1608126304.0,1606998333.0,1610820940.0,1609688069.0,1587624148.0,1606404876.0,1567543172.0,1608169428.0,1602712677.0,1610688704.0,1610107581.0,1604036584.0,1603184519.0,1593280301.0,1610112624.0,1609965904.0,1610049599.0,1607234952.0,1601542200.0,1608668130.0,1610051174.0,1610897644.0,1607291257.0,1603718355.0,1578756211.0,1610482411.0,1610132341.0,1610270622.0,1607720823.0,1610102153.0,1610818254.0,1610733064.0,1608725878.0,1610564128.0,1602617430.0,1604237611.0,1596955187.0,1608125950.0,1603718751.0,1604574937.0,1609150955.0,1610819061.0]},"kind":"numeric","n":50,"n_null":6,"n_unique":44,"null_rate":0.12,"stats":{"iqr":6160427.5,"kurtosis":8.091492742001634,"max":1610897644.0,"mean":1605282262.2954545,"median":1608147866.0,"min":1567543172.0,"n_outliers":4,"outlier_rate":0.09090909090909091,"q1":1603957125.75,"q3":1610117553.25,"skew":-2.7817834673396575,"std":8691752.954401061,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton 
categories"}],"column":"image_small_url","extras":{"singletons":50,"top_values":[["https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.200.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/044/9283/front_en.605.200.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/9759/front_en.492.200.jpg",1],["https://images.openfoodfacts.org/images/products/611/103/100/5064/front_fr.56.200.jpg",1],["https://images.openfoodfacts.org/images/products/317/568/001/1480/front_en.221.200.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/099/5553/front_en.314.200.jpg",1],["https://images.openfoodfacts.org/images/products/326/884/000/1008/front_fr.422.200.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1044/front_fr.50.200.jpg",1],["https://images.openfoodfacts.org/images/products/842/519/771/2024/front_en.60.200.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/057/8464/front_en.29.200.jpg",1],["https://images.openfoodfacts.org/images/products/611/125/934/3108/front_fr.25.200.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1228/front_fr.38.200.jpg",1],["https://images.openfoodfacts.org/images/products/800/050/031/0427/front_fr.488.200.jpg",1],["https://images.openfoodfacts.org/images/products/730/040/048/1595/front_fr.242.200.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2651/front_en.159.200.jpg",1],["https://images.openfoodfacts.org/images/products/506/004/264/1000/front_en.179.200.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/058/4724/front_en.95.200.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2606/front_en.102.200.jpg",1],["https://images.openfoodfacts.org/images/products/322/982/010/0234/front_fr.246.200.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/002/2464/front_en.301.200.jpg",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate"
:0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.200.jpg"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"packaging_recycling_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"food_groups","extras":{"singletons":5,"top_values":[["en:biscuits-and-cakes",17],["en:chocolate-products",16],["en:appetizers",4],["en:pastries",3],["en:bread",2],["en:sweets",2],["en:dairy-desserts",1],["en:unsweetened-beverages",1],["en:cereals",1],["en:dried-fruits",1],["en:cereals-and-potatoes",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":11,"null_rate":0.02,"stats":{"cardinality":11,"entropy":2.548551562412775,"entropy_ratio":0.7366966147510304,"top_rate":0.3469387755102041,"top_value":"en:biscuits-and-cakes"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nova_groups_markers","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"packaging_text_de","extras":{"singletons":1,"top_values":[["",19],["1 Folie aus 22 PAP zum Recyclen",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":2,"null_rate":0.6,"stats":{"cardinality":2,"entropy":0.28639695711595625,"entropy_ratio":0.28639695711595625,"top_rate":0.95,"top_value":""}},{"alerts":[],"column":"categories_lc","extras":{"singletons":2,"top_values":[["fr",25],["en",19],["es",2],["de",2],["it",1],["pl",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"cardinality":6,"entropy":1.6277156397787997,"entropy_ratio":0.6296863646279965,"top_rate":0.5,"top_value":"fr"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"checkers","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"packaging_text_es","extras":{"singletons":1,"top_values":[["",19],["1 caja de cart\u00f3n para reciclar, 1 bandeja de pl\u00e1stico para reciclar",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":2,"null_rate":0.6,"stats":{"cardinality":2,"entropy":0.28639695711595625,"entropy_ratio":0.28639695711595625,"top_rate":0.95,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"unknown_nutrients_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"editors_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"constant","level":"info","message":"only one distinct 
value"}],"column":"nutrition_score_warning_fruits_vegetables_nuts_estimate_from_ingredients","extras":{"histogram":{"counts":[0,0,0,45,0,0],"edges":[0.5,0.6666666666666666,0.8333333333333333,1.0,1.1666666666666665,1.3333333333333333,1.5]},"sample":[1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0]},"kind":"numeric","n":50,"n_null":5,"n_unique":1,"null_rate":0.1,"stats":{"iqr":0.0,"kurtosis":0.0,"max":1.0,"mean":1.0,"median":1.0,"min":1.0,"n_outliers":0,"outlier_rate":0.0,"q1":1.0,"q3":1.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[],"column":"labels_lc","extras":{"singletons":3,"top_values":[["en",22],["fr",22],["es",2],["de",1],["it",1],["pl",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":6,"null_rate":0.02,"stats":{"cardinality":6,"entropy":1.5695059416653905,"entropy_ratio":0.607167779504549,"top_rate":0.4489795918367347,"top_value":"en"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriscore_data","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"other_nutritional_substances_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"product_name_nb","extras":{"singletons":2,"top_values":[["",1],["99% m\u00f8rk sjokolade",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"nutrition_data_prepared_per","extras":{"singletons":0,"top_values":[["100g",50]]},"kind":"categorical","n":50,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"100g"}},{"alerts":[{"code":"long_tail","level":"info","message":"18 singleton categories"}],"column":"product_quantity","extras":{"singletons":18,"top_values":[["100",11],["230",3],["42",3],["125",2],["500",2],["150",2],["90",2],["0",2],["200",2],["300",1],["22",1],["304",1],["275",1],["225",1],["85",1],["36",1],["160",1],["20",1],["750",1],["175",1]]},"kind":"categorical","n":50,"n_null":3,"n_unique":27,"null_rate":0.06,"stats":{"cardinality":27,"entropy":4.287279855734294,"entropy_ratio":0.9016574742901039,"top_rate":0.23404255319148937,"top_value":"100"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_type","extras":{"singletons":0,"top_values":[["food",50]]},"kind":"categorical","n":50,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"food"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"checkers_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nucleotides_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"languages_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"traces_lc","extras":{"singletons":3,"top_values":[["fr",23],["en",20],["es",2],["de",1],["it",1],["pl",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":6,"null_rate":0.04,"stats":{"cardinality":6,"entropy":1.5749523572407698,"entropy_ratio":0.6092747406592504,"top_rate":0.4791666666666667,"top_value":"fr"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"categories_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"image_front_small_url","extras":{"singletons":50,"top_values":[["https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.200.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/044/9283/front_en.605.200.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/9759/front_en.492.200.jpg",1],["https://images.openfoodfacts.org/images/products/611/103/100/5064/front_fr.56.200.jpg",1],["https://images.openfoodfacts.org/images/products/317/568/001/1480/front_en.221.200.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/099/5553/front_en.314.200.jpg",1],["https://images.openfoodfacts.org/images/products/326/884/000/1008/front_fr.422.200.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1044/front_fr.50.200.jpg",1],["https://images.openfoodfacts.org/images/products/842/519/771/2024/front_en.60.200.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/057/8464/front_en.29.200.jpg",1],["https://images.openfoodfacts.org/images/products/611/125/934/3108/front_fr.25.200.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1228/front_fr.38.200.jpg",1],["https://images.openfoodfacts.org/images/products/8
00/050/031/0427/front_fr.488.200.jpg",1],["https://images.openfoodfacts.org/images/products/730/040/048/1595/front_fr.242.200.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2651/front_en.159.200.jpg",1],["https://images.openfoodfacts.org/images/products/506/004/264/1000/front_en.179.200.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/058/4724/front_en.95.200.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2606/front_en.102.200.jpg",1],["https://images.openfoodfacts.org/images/products/322/982/010/0234/front_fr.246.200.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/002/2464/front_en.301.200.jpg",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.200.jpg"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"entry_dates_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ecoscore_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"constant","level":"info","message":"only one distinct 
value"}],"column":"nutrition_score_warning_fruits_vegetables_legumes_estimate_from_ingredients","extras":{"histogram":{"counts":[0,0,0,46,0,0],"edges":[0.5,0.6666666666666666,0.8333333333333333,1.0,1.1666666666666665,1.3333333333333333,1.5]},"sample":[1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0]},"kind":"numeric","n":50,"n_null":4,"n_unique":1,"null_rate":0.08,"stats":{"iqr":0.0,"kurtosis":0.0,"max":1.0,"mean":1.0,"median":1.0,"min":1.0,"n_outliers":0,"outlier_rate":0.0,"q1":1.0,"q3":1.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[],"column":"ingredients_without_ciqual_codes_n","extras":{"histogram":{"counts":[25,9,8,4,3,0,1],"edges":[0.0,3.142857142857143,6.285714285714286,9.428571428571429,12.571428571428571,15.714285714285714,18.857142857142858,22.0]},"sample":[1.0,8.0,1.0,12.0,14.0,2.0,0.0,6.0,2.0,0.0,5.0,7.0,12.0,0.0,1.0,0.0,0.0,1.0,4.0,3.0,0.0,6.0,8.0,7.0,1.0,7.0,0.0,14.0,3.0,1.0,3.0,6.0,5.0,8.0,0.0,3.0,11.0,8.0,3.0,5.0,9.0,13.0,2.0,0.0,2.0,6.0,22.0,4.0,11.0,2.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":15,"null_rate":0.0,"stats":{"iqr":6.75,"kurtosis":1.4912337586248299,"max":22.0,"mean":4.98,"median":3.5,"min":0.0,"n_outliers":1,"outlier_rate":0.02,"q1":1.0,"q3":7.75,"skew":1.2078753068069035,"std":4.8254850660269355,"zero_rate":0.18}},{"alerts":[],"column":"rev","extras":{"histogram":{"counts":[15,9,12,6,3,3,2],"edges":[19.0,112.57142857142857,206.14285714285714,299.7142857142857,393.2857142857143,486.85714285714283,580.4285714285714,674.0]},"sample":[177.0,674.0,509.0,59.0,306.0,342.0,441.0,51.0,65.0,72.0,28.0,44.0,492.0,242.0,243.0,271.0,104.0,264.0,271.0,317.0,344.0,32.0,47.0,578.0,402.0,41.0,120.0,261.0,27.0,291.0,299.0,273.0,148.0,168.0,344.0,443.0,28.0,225.0,615.0,176.0,19.0,75.0,200.0,177.0,312.0,247.0,141.0,23.0,293.0,179.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":46,"null_rate":0.0,"stats":{"
iqr":237.75,"kurtosis":-0.022781799852933826,"max":674.0,"mean":230.0,"median":233.5,"min":19.0,"n_outliers":1,"outlier_rate":0.02,"q1":72.75,"q3":310.5,"skew":0.7091813805505103,"std":166.63708581029294,"zero_rate":0.0}},{"alerts":[{"code":"constant","level":"info","message":"only one distinct value"}],"column":"ingredients_non_nutritive_sweeteners_n","extras":{"histogram":{"counts":[0,0,0,50,0,0,0],"edges":[-0.5,-0.35714285714285715,-0.2142857142857143,-0.07142857142857145,0.0714285714285714,0.2142857142857142,0.3571428571428571,0.5]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":0.0,"max":0.0,"mean":0.0,"median":0.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":0.0,"skew":0.0,"std":0.0,"zero_rate":1.0}},{"alerts":[],"column":"ingredients_without_ecobalyse_ids_n","extras":{"histogram":{"counts":[15,16,8,6,3,1,1],"edges":[0.0,4.142857142857143,8.285714285714286,12.42857142857143,16.571428571428573,20.714285714285715,24.85714285714286,29.0]},"sample":[2.0,13.0,4.0,13.0,18.0,6.0,0.0,7.0,6.0,3.0,5.0,9.0,21.0,2.0,3.0,1.0,4.0,4.0,7.0,7.0,5.0,6.0,11.0,9.0,3.0,14.0,1.0,18.0,5.0,5.0,4.0,8.0,8.0,10.0,3.0,6.0,15.0,11.0,7.0,10.0,16.0,13.0,4.0,3.0,5.0,11.0,29.0,9.0,19.0,5.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":20,"null_rate":0.0,"stats":{"iqr":7.0,"kurtosis":1.7428354597083384,"max":29.0,"mean":8.16,"median":6.5,"min":0.0,"n_outliers":1,"outlier_rate":0.02,"q1":4.0,"q3":11.0,"skew":1.2802510763551924,"std":5.898322141222252,"zero_rate":0.02}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"environment_impact_level_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"last_image_dates_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"labels_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"33 singleton categories"}],"column":"product_name_en","extras":{"singletons":33,"top_values":[["",10],["Perly",1],["Prince Gout Chocolat",1],["Edelbitter-Schokolade",1],["tonik",1],["Gerbl\u00e9 - Sesame Cookie, 230g (8.2oz)",1],["Chocolat noir - 85% cacao",1],["Hhhhh",1],["Organic 70% Dark Chocolate Bar",1],["biscuits",1],["AUTHENTIQUE",1],["Tyrell's Lightly Sea Salted",1],["Intense dark chocolate",1],["Excellence 85% Cacao Chocolat Noir Puissant Lindt % Lindt",1],["Filled - Dark Chocolate",1],["Extra dark 74% Cocoa",1],["Fine Rye Crispbread - Fibre",1],["Tuc Original",1],["Intense Dark 70% Cocoa",1],["Gerbl\u00e9 - Apple Hazelnut Cookie, 230g (8.2oz)",1]]},"kind":"categorical","n":50,"n_null":7,"n_unique":34,"null_rate":0.14,"stats":{"cardinality":34,"entropy":4.653723337286433,"entropy_ratio":0.9147434551369997,"top_rate":0.23255813953488372,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+5.93"},{"code":"outliers","level":"warn","message":"10.9% rows beyond 1.5 
IQR"}],"column":"nutrition_score_warning_fruits_vegetables_legumes_estimate_from_ingredients_value","extras":{"histogram":{"counts":[44,1,0,0,0,1],"edges":[0.0,8.333333333333334,16.666666666666668,25.0,33.333333333333336,41.66666666666667,50.0]},"sample":[5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10.6,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.3,0.0,0.0,0.0,0.0,5.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,50.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":4,"n_unique":6,"null_rate":0.08,"stats":{"iqr":0.0,"kurtosis":35.22580605190707,"max":50.0,"mean":1.6521739130434783,"median":0.0,"min":0.0,"n_outliers":5,"outlier_rate":0.10869565217391304,"q1":0.0,"q3":0.0,"skew":5.931640486056859,"std":7.551151174355539,"zero_rate":0.8913043478260869}},{"alerts":[{"code":"long_tail","level":"info","message":"16 singleton categories"}],"column":"traces","extras":{"singletons":16,"top_values":[["",11],["en:milk,en:nuts",7],["en:nuts",5],["en:milk,en:nuts,en:sesame-seeds,en:soybeans",4],["en:milk,en:soybeans",3],["en:soybeans",2],["en:lupin,en:milk,en:nuts,en:sesame-seeds,en:soybeans",2],["en:eggs",1],["en:milk,en:nuts,en:soybeans",1],["en:eggs,en:lupin,en:milk,en:mustard,en:nuts,en:soybeans",1],["en:mustard",1],["en:lupin,en:milk,en:mustard,en:sesame-seeds,en:soybeans",1],["en:milk",1],["en:eggs,en:mustard,en:nuts,en:sesame-seeds,en:soybeans",1],["en:gluten,en:Amande,en:Arachides,en:Avoine,en:Bl\u00e9,en:Lait,en:Noisettes,en:Noix,en:Noix de cajou,en:Noix de macadamia,en:Noix de p\u00e9can,en:Noix du 
br\u00e9sil,en:Orge,en:Pistaches,en:Seigle",1],["en:lupin,en:milk,en:mustard,en:soybeans",1],["en:gluten,en:milk",1],["en:gluten,en:nuts,en:peanuts,en:soybeans",1],["en:nuts,en:peanuts,en:soybeans",1],["en:gluten,en:nuts",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":23,"null_rate":0.0,"stats":{"cardinality":23,"entropy":3.9224609850544483,"entropy_ratio":0.8671177764686753,"top_rate":0.22,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"generic_name_fi","extras":{"singletons":5,"top_values":[["Hieno tumma suklaa jossa 90% kaakaota",1],["Tumma suklaa",1],["tumma suklaa",1],["Keksej\u00e4",1],["",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":5,"null_rate":0.9,"stats":{"cardinality":5,"entropy":2.321928094887362,"entropy_ratio":1.0,"top_rate":0.2,"top_value":"Hieno tumma suklaa jossa 90% kaakaota"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"34.0% null"}],"column":"emb_codes_orig","extras":{"singletons":3,"top_values":[["",28],["EMB 31250",2],["EMB 44068A",1],["SOLENT GMBH & CO. 
KG,SCHWARZ BETEILIGUNGS GMBH",1],["EMB 64422",1]]},"kind":"categorical","n":50,"n_null":17,"n_unique":5,"null_rate":0.34,"stats":{"cardinality":5,"entropy":0.9048202460974559,"entropy_ratio":0.3896848692643728,"top_rate":0.8484848484848485,"top_value":""}},{"alerts":[],"column":"ingredients_with_specified_percent_n","extras":{"histogram":{"counts":[36,5,3,4,1,0,1],"edges":[0.0,1.1428571428571428,2.2857142857142856,3.4285714285714284,4.571428571428571,5.7142857142857135,6.857142857142857,8.0]},"sample":[0.0,3.0,0.0,1.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,2.0,4.0,0.0,0.0,3.0,0.0,2.0,4.0,0.0,1.0,1.0,3.0,0.0,0.0,0.0,1.0,0.0,2.0,1.0,4.0,0.0,0.0,2.0,8.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"iqr":2.0,"kurtosis":3.676385281133153,"max":8.0,"mean":1.1,"median":0.0,"min":0.0,"n_outliers":1,"outlier_rate":0.02,"q1":0.0,"q3":2.0,"skew":1.878233024035634,"std":1.729102633844315,"zero_rate":0.58}},{"alerts":[],"column":"nutrition_grades","extras":{"singletons":1,"top_values":[["e",27],["d",9],["c",7],["a",4],["b",2],["unknown",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"cardinality":6,"entropy":1.9126007492587709,"entropy_ratio":0.7398949689696431,"top_rate":0.54,"top_value":"e"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"weighers_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"categories_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton 
categories"}],"column":"image_url","extras":{"singletons":50,"top_values":[["https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/044/9283/front_en.605.400.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/9759/front_en.492.400.jpg",1],["https://images.openfoodfacts.org/images/products/611/103/100/5064/front_fr.56.400.jpg",1],["https://images.openfoodfacts.org/images/products/317/568/001/1480/front_en.221.400.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/099/5553/front_en.314.400.jpg",1],["https://images.openfoodfacts.org/images/products/326/884/000/1008/front_fr.422.400.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1044/front_fr.50.400.jpg",1],["https://images.openfoodfacts.org/images/products/842/519/771/2024/front_en.60.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/057/8464/front_en.29.400.jpg",1],["https://images.openfoodfacts.org/images/products/611/125/934/3108/front_fr.25.400.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1228/front_fr.38.400.jpg",1],["https://images.openfoodfacts.org/images/products/800/050/031/0427/front_fr.488.400.jpg",1],["https://images.openfoodfacts.org/images/products/730/040/048/1595/front_fr.242.400.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2651/front_en.159.400.jpg",1],["https://images.openfoodfacts.org/images/products/506/004/264/1000/front_en.179.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/058/4724/front_en.95.400.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2606/front_en.102.400.jpg",1],["https://images.openfoodfacts.org/images/products/322/982/010/0234/front_fr.246.400.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/002/2464/front_en.301.400.jpg",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"
stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.400.jpg"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"sources","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"languages_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"pnns_groups_1","extras":{"singletons":3,"top_values":[["Sugary snacks",38],["Salty snacks",4],["Cereals and potatoes",3],["unknown",2],["Milk and dairy products",1],["Beverages",1],["Fruits and vegetables",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":7,"null_rate":0.0,"stats":{"cardinality":7,"entropy":1.36033352951433,"entropy_ratio":0.4845605800770271,"top_rate":0.76,"top_value":"Sugary snacks"}},{"alerts":[],"column":"countries_lc","extras":{"singletons":3,"top_values":[["en",28],["fr",16],["es",2],["de",1],["it",1],["pl",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":6,"null_rate":0.02,"stats":{"cardinality":6,"entropy":1.5207111131435163,"entropy_ratio":0.5882913631123339,"top_rate":0.5714285714285714,"top_value":"en"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"additives_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"codes_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"countries_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"10 singleton categories"}],"column":"creator","extras":{"singletons":10,"top_values":[["openfoodfacts-contributors",23],["kiliweb",15],["javichu",2],["meryemali",1],["vichenze",1],["mllep",1],["andre",1],["sqoia",1],["shaolan",1],["tacite",1],["mambl",1],["norbert45fr",1],["date-limite-app",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":13,"null_rate":0.0,"stats":{"cardinality":13,"entropy":2.3509505113059426,"entropy_ratio":0.6353165273252817,"top_rate":0.46,"top_value":"openfoodfacts-contributors"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"6 singleton categories"},{"code":"null_rate","level":"warn","message":"76.0% null"}],"column":"product_name_nl","extras":{"singletons":6,"top_values":[["",6],["Excellence 70% Cocoa Intense Dark",1],["Tartines craquantes multi-c\u00e9r\u00e9ales",1],["Dark absolute",1],["Nuts & Fruits Mix",1],["Granola",1],["Volkoren cracotte",1]]},"kind":"categorical","n":50,"n_null":38,"n_unique":7,"null_rate":0.76,"stats":{"cardinality":7,"entropy":2.292481250360578,"entropy_ratio":0.8165982976888231,"top_rate":0.5,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_n_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"60.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_es","extras":{"singletons":0,"top_values":[["",20]]},"kind":"categorical","n":50,"n_null":30,"n_unique":1,"null_rate":0.6,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"product_name_pl","extras":{"singletons":2,"top_values":[["",3],["Czekolada gorzka 74%",1],["Excellence 70% Cocoa Intense Dark",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":3,"null_rate":0.9,"stats":{"cardinality":3,"entropy":1.3709505944546687,"entropy_ratio":0.8649735207179273,"top_rate":0.6,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"scores","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"36 singleton categories"}],"column":"brands","extras":{"singletons":36,"top_values":[["Lindt",4],["Gerbl\u00e9",3],["Excelo",3],["Henry's",2],["Pringles",2],["Perly",1],["LU",1],["\u0639\u0631\u0628\u064a",1],["J. D. 
Gross",1],["Cristaline",1],["Maruja",1],["Green & Black's",1],["Nutella",1],["wasa",1],["Tyrrell's",1],["Green and black",1],["Bjorg",1],["fin CARR\u00c9",1],["Wasa",1],["Henry\u2019s",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":41,"null_rate":0.0,"stats":{"cardinality":41,"entropy":5.213660689688186,"entropy_ratio":0.9731423391119923,"top_rate":0.08,"top_value":"Lindt"}},{"alerts":[{"code":"long_tail","level":"info","message":"15 singleton categories"},{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"ingredients_text_de","extras":{"singletons":15,"top_values":[["",5],["Kakaomasse, Kakaobutter, fettarmes Kakaopulver, Zucker, Vanille",1],["Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Zucker, Emulgator: Lecithine (Soja); Vanilleextrakt.",1],["Nuss-Nugat-Creme 40 % (Zucker, Palm\u00f6l, _HASELN\u00dcSSE_ 13 %, _MAGERMILCHPULVER_ 8.7%, fettarmer Kakao 7,4 %, Emulgator Lecithine (_SOJA_), Vanillin), _WEIZENMEHL_ (32,5 %), pflanzliche Fette (Palm, Palmkern), Rohrzucker 8,5 % (enth\u00e4lt _WEIZEN_), _MILCHZUCKER_, _WEIZENKLEIE_, _VOLLMILCHPULVER_, _GERSTENMALZ_ - und Maisextraktpulver, Honig, Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, _WEIZENST\u00c4RKE_, _GERSTENMALZMEHL_, Emulgator Lecithine (_SOJA_), Vanillin",1],["Kakaomasse, Zucker, Kakaobutter, Vanille",1],["Kartoffeln, Sonnenblumen\u00f6l, Meersalz.",1],["Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker, Vanille. 
Kann Schalenfr\u00fcchte, Milch, Soja, Sesamsamen und Weizen enthalten.",1],["kakaomass of*, zucker, kakaobutter, kakaopulver stark ent\u00f6it, emulgator: sonnenblumenlecithine (e-322), nat\u00fcrliche in vanille-aroma, \r\n* rainforest alliance certified, \r\ncocoa: 74% mindestens,",1],["_WEIZENMEHL_, Palm\u00f6l, Glukosesirup, _GERSTENMALZEXTRAKT_, Backtriebmittel (Ammoniumcarbonate, Natriumcarbonate), Speisesalz 1,4 %, _EIER_, Aroma, Mehlbehandlungsmittel (_NATRIUMMETABISULFIT_).",1],["Kakaomasse, Zucker, Kakaobutter, Emulgator: Lecithine (_Soja_); Vanilleextrakt.",1],["Kartoffelp\u00fcreepulver, pflanzliche \u00d6le (Sonnenblume, Palm, Mais) in ver\u00e4nderlichen Gewichtsanteilen, Weizenmehl, Maismehl, Reismehl, Maltodextrin, Emulgator (E471), Salz, Farbstoff (Annatto Norbixin).",1],["Kakaomasse, fettarmes Kakaopulver, Kakaobutter . Kann Schalenfr\u00fcchte, Milch und Soja enthalten.",1],["Alpenmilch Schokolade.\nZutaten: Zucker, Kakaobutter, Magermilchpulver, Kakaomasse, S\u00fc\u00dfmolkenpulver (aus Milch), Butterreinfett, Haseln\u00fcsse, Emulgatoren (Sojalecithin, E476), Aroma. Kakao: 30 % mindestens.\nKann andere N\u00fcsse und Weizen enthalten.\nOhne Farbstoffe** und Konservierungsstoffe** -**Gem\u00e4\u00df rechtlicher Vorschriften.",1],["Kakaomasse\u00b9, Rohrzucker\u00b9, Kakaobutter\u00b9, Emulgator: Lecithine (_Soja_)\u00b9. \u00b9aus kontrolliert \u00f6kologischem Anbau.",1],["25% _Walnusskerne_, 25% _Mandeln_, 25% Sultaninen geschwefelt (Sultaninen, Sonnenblumen\u00f6l, Konservierungsstoff: _Schwefeldioxid_), 25% Cranberries (Cranberries, Zucker, Sonnenblumen\u00f6l).",1],["Kakaomasse, Zucker, Kakaobutter, Emulgator (Sojalecithin), Vanille. 
Kann Haseln\u00fcsse, Mandeln, Milch enthalten.",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":16,"null_rate":0.6,"stats":{"cardinality":16,"entropy":3.7414460711655217,"entropy_ratio":0.9353615177913804,"top_rate":0.25,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_nb","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"outliers","level":"warn","message":"48.8% rows beyond 1.5 IQR"}],"column":"packagings_n","extras":{"histogram":{"counts":[10,21,0,8,1,1],"edges":[1.0,1.6666666666666665,2.333333333333333,3.0,3.6666666666666665,4.333333333333333,5.0]},"sample":[1.0,2.0,2.0,3.0,2.0,3.0,1.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,1.0,2.0,1.0,2.0,2.0,4.0,5.0,3.0,2.0,2.0,3.0,3.0,2.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,3.0]},"kind":"numeric","n":50,"n_null":9,"n_unique":5,"null_rate":0.18,"stats":{"iqr":0.0,"kurtosis":1.6015493732434862,"max":5.0,"mean":2.073170731707317,"median":2.0,"min":1.0,"n_outliers":20,"outlier_rate":0.4878048780487805,"q1":2.0,"q3":2.0,"skew":0.9834026305155502,"std":0.8772184420781127,"zero_rate":0.0}},{"alerts":[],"column":"complete","extras":{"histogram":{"counts":[34,0,0,0,0,0,16],"edges":[0.0,0.14285714285714285,0.2857142857142857,0.42857142857142855,0.5714285714285714,0.7142857142857142,0.8571428571428571,1.0]},"sample":[0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"iqr":1.0,"kurtosis":-1.404411764705883,"max":1.0,"mean":0.32,"median":0.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1"
:0.0,"q3":1.0,"skew":0.7717436331412896,"std":0.47121207149916117,"zero_rate":0.68}},{"alerts":[{"code":"long_tail","level":"info","message":"6 singleton categories"},{"code":"null_rate","level":"warn","message":"58.0% null"}],"column":"emb_codes_20141016","extras":{"singletons":6,"top_values":[["",15],["LINDT & SPR\u00dcNGLI SAS,CHOCOLADEFABRIKEN LINDT & SPR\u00dcNGLI AG",1],["EMB 44068A",1],["//HERSTELLER UND VERPACKER://,SOLENT GMBH & CO. KG,//DIE ZUGEH\u00d6RIGKEIT ZU://,SCHWARZ BETEILIGUNGS GMBH",1],["//FABRICANTE Y ENVASADOR://,LINDT & SPR\u00dcNGLI SAS,//PERTENECIENTE A://,CHOCOLADEFABRIKEN LINDT & SPR\u00dcNGLI AG",1],["//FABRICANTE Y ENVASADOR://,RAUSCH SCHOKOLADEN GMBH",1],["EMB 64422",1]]},"kind":"categorical","n":50,"n_null":29,"n_unique":7,"null_rate":0.58,"stats":{"cardinality":7,"entropy":1.6016812830583902,"entropy_ratio":0.570530384481797,"top_rate":0.7142857142857143,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_ja","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"8 singleton categories"},{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"generic_name_de","extras":{"singletons":8,"top_values":[["",12],["Edelbitterschokolade 90% Kakao",1],["Kekse mit Nuss-Nougat-Creme-F\u00fcllung",1],["Extra feine dunkle Schokolade",1],["Edelbitter-Schokolade 74% Kakao",1],["Kr\u00e4cker",1],["Edel-Bitter-Schokolade. 
Ecuador 70% Kakao",1],["Nuss-Nugat-Creme",1],["Alpenmilch-Schokolade",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":9,"null_rate":0.6,"stats":{"cardinality":9,"entropy":2.170950594454669,"entropy_ratio":0.6848586617875467,"top_rate":0.6,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"19 singleton categories"}],"column":"last_editor","extras":{"singletons":19,"top_values":[["foodless",21],["municorn-calorie-counter-app",3],["charlesnepote",2],["macrofactor",2],["bodysupport",2],["moon-rabbit",1],["gmlaa",1],["prepperapp",1],["marmotte73",1],["laura-chaud",1],["org-barilla-france-sa",1],["tom1707",1],["bubu63",1],["moncoachigbas",1],["natrius",1],["clxtng",1],["roboto-app",1],["fgouget",1],["ludolm",1],["foodiq",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":24,"null_rate":0.02,"stats":{"cardinality":24,"entropy":3.512800591451587,"entropy_ratio":0.7661568858849049,"top_rate":0.42857142857142855,"top_value":"foodless"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"minerals_prev_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-2.44"}],"column":"last_image_t","extras":{"histogram":{"counts":[2,0,0,0,5,17,26],"edges":[1639159016.0,1657518505.857143,1675877995.7142856,1694237485.5714285,1712596975.4285715,1730956465.2857144,1749315955.142857,1767675445.0]},"sample":[1767287564.0,1762497041.0,1766662029.0,1762902315.0,1736701553.0,1760023391.0,1754664712.0,1767381324.0,1735647179.0,1738059985.0,1735033991.0,1733053762.0,1766619585.0,1767675414.0,1755716320.0,1730578039.0,1722883884.0,1763672849.0,1761392846.0,1761564203.0,1767675445.0,1735241808.0,1735034216.0,1755432475.0,1766261975.0,1639306722.0,1719418009.0,1757677414.0,1735068633.0,1765741117.0,1764184766.0,1735338708.0,1766822100.0,1732383807.0,1741976090.0,1738313702.0,1639159016.0,1713918514.0,1745253202.0,1767514906.0,1733491222.0,1763720506.0,1764812562.0,1759483937.0,1767545777.0,1745732862.0,1749725510.0,1736072564.0,1726833790.0,1738151211.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"iqr":28956774.25,"kurtosis":7.36038843000579,"max":1767675445.0,"mean":1745146211.04,"median":1752195111.0,"min":1639159016.0,"n_outliers":2,"outlier_rate":0.04,"q1":1735111926.75,"q3":1764068701.0,"skew":-2.4427262292167367,"std":26812693.31109656,"zero_rate":0.0}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"obsolete_since_date","extras":{"singletons":0,"top_values":[["",44]]},"kind":"categorical","n":50,"n_null":6,"n_unique":1,"null_rate":0.12,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"pnns_groups_2_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"emb_codes_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"37 singleton categories"}],"column":"countries_beforescanbot","extras":{"singletons":37,"top_values":[["France",6],["Maroc",1],["Belgique,France,Polyn\u00e9sie fran\u00e7aise,Guadeloupe,Luxembourg,Portugal,La R\u00e9union",1],["Argelia,B\u00e9lgica,Rep\u00fablica Checa,Finlandia,Francia,Polinesia Francesa,Alemania,Italia,Mauricio,Marruecos,Pa\u00edses Bajos,Reuni\u00f3n,Singapur,Espa\u00f1a,Suecia,Suiza,Reino Unido",1],["en:Morocco",1],["nl:Duitsland,nl:Sloveni\u00eb,nl:Spanje,nl:Frankrijk",1],["Belgique,C\u00f4te d'Ivoire,France,Luxembourg,Mali,Martinique,Russie,Suisse,Royaume-Uni",1],["Alg\u00e9rie, Cameroun, France, Maroc, en:spain",1],["France,Su\u00e8de,Royaume-Uni",1],["France,Allemagne,Italie",1],["France,Italie,Espagne,Suisse",1],["\u010cesko,Francie,N\u011bmecko,Guadeloupe,It\u00e1lie,en:algerie,en:espagne,en:la-reunion,en:royaume-uni,en:suisse",1],["Belgique,France,Royaume-Uni",1],["Austria,France,Italy,R\u00e9union,Spain,Alemania,Belgica,Francia,Paises-bajos,Suiza",1],["Finland,France,Germany,Spain",1],["France,Guadeloupe,La R\u00e9union,Suisse,en:en",1],["en:fr",1],["Germany",1],["Australia, Belgium, Denmark, Estonia, France, Germany, Hungary, Italy, Lebanon, Portugal, Serbia, Spain, Switzerland, United Kingdom, 
en:nl",1],["Belgique,France,Pays-Bas,S\u00e9n\u00e9gal",1]]},"kind":"categorical","n":50,"n_null":7,"n_unique":38,"null_rate":0.14,"stats":{"cardinality":38,"entropy":5.065572312741006,"entropy_ratio":0.9652519589427557,"top_rate":0.13953488372093023,"top_value":"France"}},{"alerts":[],"column":"nutrition_grade_fr","extras":{"singletons":1,"top_values":[["e",27],["d",9],["c",7],["a",4],["b",2],["unknown",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"cardinality":6,"entropy":1.9126007492587709,"entropy_ratio":0.7398949689696431,"top_rate":0.54,"top_value":"e"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"ingredients_with_specified_percent_sum","extras":{"histogram":{"counts":[33,0,2,4,5,4,2],"edges":[0.0,14.228571428571428,28.457142857142856,42.68571428571428,56.91428571428571,71.14285714285714,85.37142857142857,99.6]},"sample":[0.0,54.5,0.0,41.6,78.4,0.0,0.0,0.0,0.0,0.0,0.0,0.0,70.1,0.0,0.0,0.0,0.0,0.0,57.0,0.0,7.0,0.0,3.4,0.0,0.0,0.0,99.6,84.3,0.0,0.0,29.1,0.0,63.0,77.6,0.0,53.0,11.0,65.0,0.0,0.0,0.0,3.0,0.0,50.0,70.0,73.0,0.0,0.0,48.0,98.5]},"kind":"numeric","n":50,"n_null":0,"n_unique":22,"null_rate":0.0,"stats":{"iqr":52.25,"kurtosis":-0.5856249010639578,"max":99.6,"mean":22.741999999999997,"median":0.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":52.25,"skew":0.9979114229555857,"std":32.88026571470169,"zero_rate":0.58}},{"alerts":[{"code":"null_rate","level":"warn","message":"68.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_it","extras":{"singletons":0,"top_values":[["",16]]},"kind":"categorical","n":50,"n_null":34,"n_unique":1,"null_rate":0.68,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[],"column":"nutrition_data_per","extras":{"singletons":0,"top_values":[["100g",42],["serving",8]]},"kind":"categorical","n":50,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.6343095546405662,"entropy_ratio":0.6343095546405662,"top_rate":0.84,"top_value":"100g"}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_pl","extras":{"singletons":0,"top_values":[["",5]]},"kind":"categorical","n":50,"n_null":45,"n_unique":1,"null_rate":0.9,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"product","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"27 singleton 
categories"}],"column":"link","extras":{"singletons":27,"top_values":[["",21],["www.copag.ma",1],["https://www.lu.fr/prince",1],["http://www.lindt.es/swf/spa/productos/excellence/altos-porcentajes/excellence-90/www.lindt.com",1],["https://www.gerble.fr/vitalite/biscuit-sesame",1],["https://www.nutella.com/de/de/produkte/nutella-biscuits",1],["http://www.wasa.fr/produits/tartines-croustillantes/authentique/pack/",1],["https://www.lindt.fr/excellence-noir-70",1],["https://www.tyrrellscrisps.co.uk/range/potato-crisps/lightly-sea-salted/",1],["https://www.lindt.fr/excellence-noir-85",1],["www.bjorg.fr",1],["https://www.wasa.fr",1],["www.henrys.ma",1],["https://www.tuc.eu/produkte_de_at#tuc-prod-4",1],["http://www.lindt.es/swf/spa/productos/excellence/altos-porcentajes/excellence-70/",1],["https://www.lepaindesfleurs.fr/la-marque",1],["https://www.gerble.fr/teneur-reduite/biscuit-pomme-noisette",1],["https://www.pringles.com/de/products/flavours/pringles-original-product.html",1],["http://www.lindt.ca/swf/fra/produits/excellence/barres/excellence-99-cacao/",1],["www.nestledessert.fr",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":28,"null_rate":0.04,"stats":{"cardinality":28,"entropy":3.663323628255448,"entropy_ratio":0.762024790690408,"top_rate":0.4375,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"8 singleton categories"},{"code":"null_rate","level":"warn","message":"76.0% null"}],"column":"ingredients_text_nl","extras":{"singletons":8,"top_values":[["",4],["Cacaomassa, cacaoboter, magere cacaopoeder, suiker.",1],["Aardappelen, zonnebloemolie, zeezout.",1],["Cacaomassa, magere cacao, cacaoboter, bruine suiker, vanille. 
Kan noten, melk, soja, sesamzaad en tarwe bevatten.",1],["Cacaomassa, suiker, cacaoboter, vanille.",1],["Cacaomassa, magere cacaopoeder, cacaoboter, bruine suiker.",1],["*Referentie inname van een gemiddelde volwassehe (8400 kJ/ 2000 ReJI), 16,7 g 46x4, www,snackmindful,com Milka www,milka,com ER Mondelez France SAS, 6 avenue R\u00e9aumur, CS 50014, 92142 Clamart Cedex, Service Consommateurs N\u00ba Cristal:09,69,39,79,79 BE Mondelez Belgium, Stationsstraat 100, 2800 Mechelen, ND Mondelez Nederland, Verlengde Poolseweg 34, 4818 CL Breda, eu mondelezinternational,com e 100 g COCOA LIFE www,cocoalife,org 8 FR FRANCE ONLY 05 pp 3 045140 105502",1],["_tarwebloem_ 47%, _melkchocolade_ 29% (suiker, cacaomassa, cacaoboter, weipoeder (van _melk_), magere _melkpoeder_, plantaardige vetten (shea, palm in wisselende verhoudingen), _melkvet_, emulgatoren (_sojalecithine_, E476), lactose (van _melk_), aroma), plantaardige oli\u00ebn (palm, kokos), suiker, suikerstroop, _tarwezemelen_, rijsmiddelen (natriumwaterstofcarbonaat, ammoniumwaterstofcarbonaat), zout, _tarwekiemen_, voedingszuur (citroenzuur)",1],["granen 98.3% (_volkorentarwemeel_ 65.8%, _roggebloem_, _tarwebloem_ 10.2%, rijstbloem, gemoute _tarwebloem_, _tarwegriesmeel_, boekweitbloem, _gerstebloem_), suiker, magere _melkpoeder_, zout, palmolie, _tarwekiemen_, emulgator 
(zonnebloemlecithine)",1]]},"kind":"categorical","n":50,"n_null":38,"n_unique":9,"null_rate":0.76,"stats":{"cardinality":9,"entropy":2.9182958340544896,"entropy_ratio":0.9206198357143051,"top_rate":0.3333333333333333,"top_value":""}},{"alerts":[],"column":"additives_n","extras":{"histogram":{"counts":[29,11,3,3,2,1,1],"edges":[0.0,1.1428571428571428,2.2857142857142856,3.4285714285714284,4.571428571428571,5.7142857142857135,6.857142857142857,8.0]},"sample":[0.0,3.0,0.0,0.0,4.0,1.0,0.0,2.0,1.0,0.0,0.0,2.0,5.0,0.0,0.0,0.0,0.0,0.0,2.0,1.0,0.0,2.0,6.0,3.0,0.0,4.0,0.0,2.0,0.0,1.0,1.0,2.0,2.0,2.0,0.0,1.0,4.0,2.0,1.0,0.0,3.0,0.0,1.0,0.0,1.0,2.0,8.0,2.0,5.0,0.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":8,"null_rate":0.0,"stats":{"iqr":2.0,"kurtosis":2.1046220800633053,"max":8.0,"mean":1.52,"median":1.0,"min":0.0,"n_outliers":2,"outlier_rate":0.04,"q1":0.0,"q3":2.0,"skew":1.4732170682059635,"std":1.8209663279003647,"zero_rate":0.4}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"generic_name_sv","extras":{"singletons":4,"top_values":[["Fin m\u00f6rk choklad med 90% kakao",1],["M\u00f6rk choklad",1],["",1],["Kex",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":4,"null_rate":0.92,"stats":{"cardinality":4,"entropy":2.0,"entropy_ratio":1.0,"top_rate":0.25,"top_value":"Fin m\u00f6rk choklad med 90% kakao"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"ingredients_that_may_be_from_palm_oil_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"known_ingredients_n","extras":{"histogram":{"counts":[16,12,6,7,5,2,2],"edges":[0.0,5.142857142857143,10.285714285714286,15.42857142857143,20.571428571428573,25.714285714285715,30.85714285714286,36.0]},"sample":[4.0,19.0,5.0,8.0,22.0,7.0,1.0,9.0,8.0,4.0,0.0,26.0,34.0,4.0,4.0,3.0,5.0,5.0,14.0,9.0,6.0,20.0,17.0,12.0,4.0,19.0,3.0,22.0,5.0,6.0,8.0,14.0,12.0,14.0,3.0,7.0,24.0,20.0,10.0,16.0,21.0,0.0,5.0,9.0,6.0,16.0,36.0,22.0,26.0,14.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":22,"null_rate":0.0,"stats":{"iqr":13.5,"kurtosis":0.07410982999798543,"max":36.0,"mean":11.76,"median":9.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":5.0,"q3":18.5,"skew":0.8598171852923553,"std":8.721449046425011,"zero_rate":0.04}},{"alerts":[{"code":"outliers","level":"warn","message":"12.0% rows beyond 1.5 IQR"}],"column":"completeness","extras":{"histogram":{"counts":[3,3,2,2,22,9,9],"edges":[0.575,0.65,0.725,0.8,0.875,0.9500000000000001,1.0250000000000001,1.1]},"sample":[1.0625,0.9,0.8875,0.8,1.0,0.9875,1.1,0.7875,0.7875,0.9,0.5875,0.8875,0.9,0.9,0.9,1.0,0.9875,0.9,0.9,1.1,1.0,0.8875,0.6875,0.8875,0.8875,0.9875,1.0,1.1,0.675,1.1,0.8875,0.8875,0.8875,1.1,1.1,0.9875,0.85,0.9,1.1,1.1,0.575,0.5875,0.9,0.9,0.9,0.9,0.875,0.6875,1.0,0.8875]},"kind":"numeric","n":50,"n_null":0,"n_unique":14,"null_rate":0.0,"stats":{"iqr":0.11250000000000004,"kurtosis":0.320000659997818,"max":1.1,"mean":0.91,"median":0.9,"min":0.575,"n_outliers":6,"outlier_rate":0.12,"q1":0.8875,"q3":1.0,"skew":-0.6678261639637765,"std":0.13580823815593962,"zero_rate":0.0}},{"alerts":[{"code":"constant","level":"info","message":"only one distinct 
value"}],"column":"ingredients_sweeteners_n","extras":{"histogram":{"counts":[0,0,0,50,0,0,0],"edges":[-0.5,-0.35714285714285715,-0.2142857142857143,-0.07142857142857145,0.0714285714285714,0.2142857142857142,0.3571428571428571,0.5]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":1,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":0.0,"max":0.0,"mean":0.0,"median":0.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":0.0,"skew":0.0,"std":0.0,"zero_rate":1.0}},{"alerts":[],"column":"nova_groups","extras":{"singletons":1,"top_values":[["4",33],["3",14],["1",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":3,"null_rate":0.04,"stats":{"cardinality":3,"entropy":1.0064630247287516,"entropy_ratio":0.6350074681708949,"top_rate":0.6875,"top_value":"4"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"allergens_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"obsolete","extras":{"singletons":0,"top_values":[["",44]]},"kind":"categorical","n":50,"n_null":6,"n_unique":1,"null_rate":0.12,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_sv","extras":{"singletons":0,"top_values":[["",4]]},"kind":"categorical","n":50,"n_null":46,"n_unique":1,"null_rate":0.92,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"packaging_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"ingredients_with_unspecified_percent_n","extras":{"histogram":{"counts":[22,13,6,7,1,0,1],"edges":[1.0,5.571428571428571,10.142857142857142,14.714285714285714,19.285714285714285,23.857142857142854,28.428571428571427,33.0]},"sample":[5.0,12.0,5.0,10.0,16.0,6.0,1.0,8.0,7.0,4.0,5.0,11.0,22.0,4.0,4.0,3.0,5.0,5.0,11.0,7.0,5.0,7.0,9.0,10.0,4.0,17.0,1.0,15.0,5.0,5.0,4.0,11.0,7.0,8.0,3.0,5.0,19.0,13.0,9.0,15.0,16.0,11.0,4.0,5.0,4.0,10.0,33.0,10.0,19.0,5.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":18,"null_rate":0.0,"stats":{"iqr":6.0,"kurtosis":3.545244444444444,"max":33.0,"mean":8.8,"median":7.0,"min":1.0,"n_outliers":2,"outlier_rate":0.04,"q1":5.0,"q3":11.0,"skew":1.6446666666666663,"std":6.0609152673132645,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"46.0% null"},{"code":"high_skew","level":"info","message":"skew=+4.90"}],"column":"fruits-vegetables-nuts_100g_estimate","extras":{"histogram":{"counts":[26,0,0,0,1],"edges":[0.0,17.0,34.0,51.0,68.0,85.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,85.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":23,"n_unique":2,"null_rate":0.46,"stats":{"iqr":0.0,"kurtosis":22.038461538461522,"max":85.0,"mean":3.1481481481481484,"median":0.0,"min":0.0,"n_outliers":1,"outlier_rate":0.037037037037037035,"q1":0.0,"q3":0.0,"skew":4.9029033784545994,"std":16.358257627039396,"zero_rate":0.9629629629629629}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"}],"column":"emb_codes","extras":{"singletons":7,"top_values":[["",35],["FSC-C021442",2],["FSC-C012484",2],["EMB 31250",2],["LPL.28.01.13",1],["EMB 44068A",1],["SOLENT GMBH & CO. 
KG,SCHWARZ BETEILIGUNGS GMBH",1],["200029-N4/7243",1],["EMB 64422",1],["FSC-C190426",1],["C-352-255-22-10",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":11,"null_rate":0.04,"stats":{"cardinality":11,"entropy":1.7198603008654514,"entropy_ratio":0.49715111916070204,"top_rate":0.7291666666666666,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"packagings","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"purchase_places_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"additives_original_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton 
categories"}],"column":"image_front_url","extras":{"singletons":50,"top_values":[["https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/044/9283/front_en.605.400.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/9759/front_en.492.400.jpg",1],["https://images.openfoodfacts.org/images/products/611/103/100/5064/front_fr.56.400.jpg",1],["https://images.openfoodfacts.org/images/products/317/568/001/1480/front_en.221.400.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/099/5553/front_en.314.400.jpg",1],["https://images.openfoodfacts.org/images/products/326/884/000/1008/front_fr.422.400.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1044/front_fr.50.400.jpg",1],["https://images.openfoodfacts.org/images/products/842/519/771/2024/front_en.60.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/057/8464/front_en.29.400.jpg",1],["https://images.openfoodfacts.org/images/products/611/125/934/3108/front_fr.25.400.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1228/front_fr.38.400.jpg",1],["https://images.openfoodfacts.org/images/products/800/050/031/0427/front_fr.488.400.jpg",1],["https://images.openfoodfacts.org/images/products/730/040/048/1595/front_fr.242.400.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2651/front_en.159.400.jpg",1],["https://images.openfoodfacts.org/images/products/506/004/264/1000/front_en.179.400.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/058/4724/front_en.95.400.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2606/front_en.102.400.jpg",1],["https://images.openfoodfacts.org/images/products/322/982/010/0234/front_fr.246.400.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/002/2464/front_en.301.400.jpg",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate"
:0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.400.jpg"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_bugs_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_fi","extras":{"singletons":0,"top_values":[["",5]]},"kind":"categorical","n":50,"n_null":45,"n_unique":1,"null_rate":0.9,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"images","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_analysis","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"ingredients_text_with_allergens_pl","extras":{"singletons":2,"top_values":[["",2],["Miazga kakaowa, cukier, t\u0142uszcz kakaowy, kakao w proszku o obni\u017conej zawarto\u015bci t\u0142uszczu, emulgator: lecytyny (<span class=\"allergen\">soja</span>); naturalny aromat waniliowy. Czekolada gorzka: masa kakaowa minimum 74 %. 
Mo\u017ce zawiera\u0107<span class=\"allergen\"> orzeszki ziemne</span>,<span class=\"allergen\"> orzechy</span>,<span class=\"allergen\"> mleko</span> i <span class=\"allergen\">gluten</span> (<span class=\"allergen\">pszenica</span>, \u017cyt j\u0119czmie\u0144,<span class=\"allergen\"> owies</span>, pszenica orkisz i pszenica khorosan).",1],["Miazga kakaowa, cukier, t\u0142uszcz kakaowy, wanilia.",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":3,"null_rate":0.92,"stats":{"cardinality":3,"entropy":1.5,"entropy_ratio":0.9463946303571862,"top_rate":0.5,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"15 singleton categories"},{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"product_name_de","extras":{"singletons":15,"top_values":[["",5],["Edelbitterschokolade Mild 90%",1],["Edelbitter mild 85%",1],["Knusprige Kekse mit einem cremigen Herz aus Nutella\u00ae",1],["Lightly Sea Salted",1],["85% kraftvoller schwarzer Kakao",1],["Noir intense 74%cacao",1],["Tuc Original",1],["Schokolade Ecuador Edelbitter 70% Cacao",1],["Nutella",1],["Bitter Extra Kraftig",1],["Schokolade (Alpenmilch Schokolade)",1],["Granatapfel Sauerkirsche Fruchtgummi",1],["Bio-Bitterschokolade 70%",1],["Nuss-Frucht-Mix",1],["Dark Milde Edelbitter Scholade 70%",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":16,"null_rate":0.6,"stats":{"cardinality":16,"entropy":3.7414460711655217,"entropy_ratio":0.9353615177913804,"top_rate":0.25,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_nb","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton 
categories"},{"code":"null_rate","level":"warn","message":"68.0% null"}],"column":"packaging_text_it","extras":{"singletons":2,"top_values":[["",14],["Incarto esterno in carta da riciclare, Incarto interno in alluminio da riciclare.",1],["1 tubo C/PAP 85 da indifferenziata, 1 sigillo C/PAP 84 da indifferenziata, 1 tappo di plastica PP5 da riciclare.",1]]},"kind":"categorical","n":50,"n_null":34,"n_unique":3,"null_rate":0.68,"stats":{"cardinality":3,"entropy":0.6685644431995964,"entropy_ratio":0.42181719939456,"top_rate":0.875,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"11 singleton categories"},{"code":"null_rate","level":"warn","message":"68.0% null"}],"column":"product_name_it","extras":{"singletons":11,"top_values":[["",5],["Fondente Prodigioso 90% Cacao",1],["Croccanti biscotti con cuore cremoso di Nutella",1],["Excellence 85% Cacao Chocolat Noir Puissant Lindt % Lindt",1],["cioccolato fondente",1],["Original",1],["Excellence 70% Cocoa Fondente Intenso",1],["Cioccolato fondente",1],["Pringles classiche 175 gr",1],["Milka",1],["Mix di frutta secca",1],["Granola",1]]},"kind":"categorical","n":50,"n_null":34,"n_unique":12,"null_rate":0.68,"stats":{"cardinality":12,"entropy":3.274397470347699,"entropy_ratio":0.9133700756113953,"top_rate":0.3125,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"21 singleton categories"}],"column":"serving_quantity","extras":{"singletons":21,"top_values":[["100",7],["10",7],["20",3],["25",2],["42",2],["30",2],["23",1],["11.5",1],["1000",1],["13.8",1],["11.4",1],["18",1],["50",1],["85",1],["36",1],["40",1],["45",1],["8.4",1],["7.143",1],["58",1]]},"kind":"categorical","n":50,"n_null":6,"n_unique":27,"null_rate":0.12,"stats":{"cardinality":27,"entropy":4.321753063842526,"entropy_ratio":0.9089075318556188,"top_rate":0.1590909090909091,"top_value":"100"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton 
categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_ja","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"ingredients_text_with_allergens_sv","extras":{"singletons":4,"top_values":[["kakaomassa, kakaosm\u00f6r, fettreducerat kakaopulver, socker, vanilj.",1],["kakaomassa, fettreducerat kakaopulver, kakaosm\u00f6r, socker, emulgeringsmedel (<span class=\"allergen\">sojalecitin</span>), vaniljextrakt. Minst 85 % kakao i chokladen. Kan inneh\u00e5lla sp\u00e5r av<span class=\"allergen\"> n\u00f6tter</span> och <span class=\"allergen\">mj\u00f6lk</span>.",1],["",1],["<span class=\"allergen\">VETEMJ\u00d6L</span>/<span class=\"allergen\">HVEDEMEL</span>, palmolja/-olie, glukossirap, maltextrakt fr\u00e5n <span class=\"allergen\">KORN</span>/<span class=\"allergen\">BYG</span>, bakpulver/h\u00e6vemidler (ammoniumkarbonater, natriumkarbonater), salt, <span class=\"allergen\">\u00c4GG</span>/<span class=\"allergen\">\u00c6G</span>/<span class=\"allergen\">EGG</span>, arom, mj\u00f6lbehandlingsmedel/melbehandlingsmiddel (<span class=\"allergen\">NATRIUMDISULFIT</span>).",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":4,"null_rate":0.92,"stats":{"cardinality":4,"entropy":2.0,"entropy_ratio":1.0,"top_rate":0.25,"top_value":"kakaomassa, kakaosm\u00f6r, fettreducerat kakaopulver, socker, vanilj."}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"allergens_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"46 singleton categories"}],"column":"ingredients_text_fr","extras":{"singletons":46,"top_values":[["",2],["Lait \u00e9cr\u00e9m\u00e9, cr\u00e8me, SUcre, ferments laciques",1],["C\u00e9r\u00e9ale 50 % (Farine de bl\u00e9 34,8 %, farine de bl\u00e9 complet 15,2 %), sucre, huiles v\u00e9g\u00e9tales (palme, colza), cacao maigre en poudre 4,5 %, sirop de glucose, amidon de bl\u00e9, poudres \u00e0 lever (carbonates d'ammonium, carbonates de sodium), \u00e9mulsifiant (l\u00e9cithines de soja), sel, lait \u00e9cr\u00e9m\u00e9 en poudre, perm\u00e9at de lactos\u00e9rum (de lait), ar\u00f4mes. Peut contenir \u0153uf.",1],["P\u00e2te de cacao, beurre de cacao, cacao maigre, sucre, vanille.",1],["Coffret fourr\u00e9 au cacao (41,6%) et \u00e0 la vanille (208) - Ingr\u00e9dients Farine de bl\u00e9, sucre, huile v\u00e9g\u00e9tale non hydrog\u00e9n\u00e9e (huile de palme), filtrat de lait, poudre de cacao \u00c9mulsifiant \u00e0 faible teneur en cacao (322) L\u00e9cithine de soja) Agent levant (5000) Sucre artificiel (vanilline) Sel Contient du lait, du bl\u00e9 (gluten) du soja",1],["Farine de bl\u00e9 57%, sucre de canne roux, huile de colza, s\u00e9same toast\u00e9 10,6%, germe de bl\u00e9 5,4%, farine compl\u00e8te de bl\u00e9 5,4%, ar\u00f4me naturel, magn\u00e9sium, \u00e9mulsifiant : l\u00e9cithines, poudres \u00e0 lever (tartrates de potassium, carbonates de sodium, carbonates d'ammonium), sel de mer, amidon de bl\u00e9, vitamines (E, PP, B6, B1, B9).",1],["P\u00e2te de cacao, cacao maigre en poudre, beurre de cacao, sucre, \u00e9mulsifiant : l\u00e9cithines (soja) ; extrait de vanille. 
Traces \u00e9ventuelles de fruits \u00e0 coque et de lait.",1],["Eau de source",1],["Farine de froment, sucre, graisse v\u00e9g\u00e9tale, sucre inverti, agents levants ( bicarbonate d'ammonium - bicarbonate de sodium), sel, arome.",1],["Sucre, graisse vegetale de palmiste hidrogen\u00e9e, Lait Enteir en poudre, Amandes, Cacao D\u00e9graiss\u00e9 en poudre, lactoserum en poudre, Emulsifiant L\u00e9cithine de soja, Ar\u00f4mes (Vainilline).",1],["\u062f\u0642\u064a\u0642\u0627\u0644\u0642\u0645\u062d\u060c\u0631\u0642\u0627\u0626\u0642 \u0627\u0644\u0634\u0648\u0643\u0648\u0644\u0627\u062a\u064720%[\u0639\u062c\u064a\u0646\u0629 \u0632\u064a\u062a \u0627\u0644\u0646\u062e\u0644\u0629.\u0627\u0644\u0643\u0627\u0643\u0627\u0648\u060c\u0633\u0643\u0631\u060c\u062f\u0643\u0633\u062a\u0631\u0648\u0632 \u0648 \u0645\u0633\u062a\u062d\u0644\u0628",1],["Farine de _froment_, sucre, graisse v\u00e9g\u00e9tale, noix de coco r\u00e2p\u00e9e, poudre de _lait_, poudre de _lactos\u00e9rum_, sucre inverti, agents levants (bicarbonate d'ammonium - bicarbonate de Sodium), sel, ar\u00f4mes.",1],["P\u00e2te \u00e0 tartiner aux NOISETTES et au cacao 40% (sucre, huile de palme, NOISETTES 13%**, LAIT \u00e9cr\u00e9m\u00e9 en poudre 8,7%**, cacao maigre 7,4%**, \u00e9mulsifiants : l\u00e9cithines [SOJA]; vanilline), farine de FROMENT 32,5%, graisses v\u00e9g\u00e9tales (palme, palmiste), sucre de canne (contient BLE) 8,5%, LACTOSE, son de BLE, LAIT en poudre, miel, poudres \u00e0 lever (diphosphate disodique, carbonate acide de sodium, carbonate acide d'ammonium), farine d'ORGE malt\u00e9, cacao maigre en poudre, sel, extrait en poudre de malt d'ORGE et de ma\u00efs, amidon de FROMENT, \u00e9mulsifiants: l\u00e9cithines [SOJA]; vanilline.",1],["Farine compl\u00e8te de SEIGLE (77 g*), farine de SEIGLE (28 g*), levure, sel. Peut contenir des traces de LUPIN, LAIT, MOUTARDE, GRAINES DE S\u00c9SAME et SOJA. 
*en g pour 100 g de produit.",1],["P\u00e2te de cacao, sucre, beurre de cacao, vanille.\r\n\r\nPeut contenir des fruits \u00e0 coque, du lait, du soja et des graines de s\u00e9same.",1],["p\u00e2te de cacao*, beurre de cacao*, cacao maigre en poudre*, sucre de canne*, extrait de vanille*, * ingr\u00e9dients issus de l'agriculture biologique",1],["P\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille",1],["Farine de bl\u00e9* 41%, Chocolat noir* 22% (p\u00e2te de cacao*, sucre de canne&quot;, beurre de cacao&quot;), Sucre de canne* roux non raffin\u00e9, Farine compl\u00e8te de bl\u00e9* 16%, Huile de tournesol ol\u00e9ique*, Ar\u00f4me naturel de vanille, Lait \u00e9cr\u00e9m\u00e9 en poudre, Sel de mer, carbonates d'ammonium, carbonates de sodium, gomme d'acacia*, extraits de romarin* Peut contenir du soja, des \u0153ufs, des fruits \u00e0 coque, des graines de s\u00e9same et de la moutarde. *Ingr\u00e9dients biologiques.",1],["P\u00e2te de cacao, sucre, beurre de cacao, cacao maigre en poudre, \u00e9mulsifiant : l\u00e9cithines (_soja_), ar\u00f4me naturel de vanille.",1],["Farine compl\u00e8te de SEIGLE 59 g*, son de BL\u00c9 27 g*, flocons d'AVOINE 12 g*, GRAINES DE S\u00c9SAME 7,0 g*, germe de BL\u00c9, sel. *en g pour 100 g de produit fini. 
Peut contenir des traces de LUPIN, LAIT, MOUTARDE et SOJA.",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":47,"null_rate":0.04,"stats":{"cardinality":47,"entropy":5.543295834054491,"entropy_ratio":0.9979669030553475,"top_rate":0.041666666666666664,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+6.86"}],"column":"nutrition_score_beverage","extras":{"histogram":{"counts":[49,0,0,0,0,0,1],"edges":[0.0,0.14285714285714285,0.2857142857142857,0.42857142857142855,0.5714285714285714,0.7142857142857142,0.8571428571428571,1.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":45.020408163265344,"max":1.0,"mean":0.02,"median":0.0,"min":0.0,"n_outliers":1,"outlier_rate":0.02,"q1":0.0,"q3":0.0,"skew":6.857142857142859,"std":0.14142135623730948,"zero_rate":0.98}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_ids_debug","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"nutrition_data","extras":{"singletons":0,"top_values":[["on",49]]},"kind":"categorical","n":50,"n_null":1,"n_unique":1,"null_rate":0.02,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"on"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_ja","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"}],"column":"packaging_text_en","extras":{"singletons":4,"top_values":[["",39],["1 plastic bottle to recycle\r\n1 plastic cap to recycle",1],["1 cardboard sleeve recyclable, 1 sheet of aluminium recyclable",1],["Terracycle. Please dispose of this pack responsibly. Find out more at www.terracycle.co.uk.",1],["cardboard (to recycle)\r\nfoil paper (to throw away)",1]]},"kind":"categorical","n":50,"n_null":7,"n_unique":5,"null_rate":0.14,"stats":{"cardinality":5,"entropy":0.6325278585247099,"entropy_ratio":0.2724149209949562,"top_rate":0.9069767441860465,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+4.24"},{"code":"outliers","level":"warn","message":"16.0% rows beyond 1.5 IQR"}],"column":"unknown_ingredients_n","extras":{"histogram":{"counts":[46,1,1,0,1,0,1],"edges":[0.0,1.8571428571428572,3.7142857142857144,5.571428571428571,7.428571428571429,9.285714285714286,11.142857142857142,13.0]},"sample":[1.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,13.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":18.31940434832385,"max":13.0,"mean":0.66,"median":0.0,"min":0.0,"n_outliers":8,"outlier_rate":0.16,"q1":0.0,"q3":0.0,"skew":4.236444254420296,"std":2.255243323674763,"zero_rate":0.84}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"ingredients_from_palm_oil_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"labels_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"35 singleton categories"},{"code":"null_rate","level":"warn","message":"24.0% null"}],"column":"packaging_old_before_taxonomization","extras":{"singletons":35,"top_values":[["plastique",3],["fr:Film en plastique,paquet,fr:Etui en carton",1],["Papel de aluminio,Caja de cart\u00f3n,Carton,Karton,emballage,box cardboard,Aluminium wrap, en:card-box, en:foil-wrapper",1],["Carton,Sachets,20 biscuits en 4 sachets,packet,paquetes",1],["sl:PAP,fr:FSC mixte,Produkt,21 PAP",1],["Papier,aluminium",1],["Plastic",1],["Plastique,en:mixed plastic-packet,Enveloppe",1],["fr:Papier,Package paper,Paper recycling,papier,Enveloppe",1],["carton,aluminium,Emballage carton",1],["Sachet,Sous atmosph\u00e8re protectrice,en:mixed plastic-packet",1],["paper, foil",1],["papier aluminium,emballage carton",1],["fr:film plastique \u00e0 jeter,fr:\u00e9tui carton \u00e0 recycler, fr:Film en plastique",1],["papier,Enveloppe",1],["paper",1],["Kunststoff",1],["Papel de aluminio, Caja de cart\u00f3n, Carton, en:card-carton, en:aluminium-wrapper",1],["Carton,plastique",1],["4 sachets plastiques de 4 biscuits, Carton, fr:Film en plastique, fr:Etui en carton",1]]},"kind":"categorical","n":50,"n_null":12,"n_unique":36,"null_rate":0.24,"stats":{"cardinality":36,"entropy":5.122798894965602,"entropy_ratio":0.9908845667077253,"top_rate":0.07894736842105263,"top_value":"plastique"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"packaging_text_nb","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutrition_grades_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"category_properties","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"nutriscore_score","extras":{"histogram":{"counts":[8,5,7,13,12,2,2],"edges":[0.0,5.714285714285714,11.428571428571429,17.142857142857142,22.857142857142858,28.571428571428573,34.285714285714285,40.0]},"sample":[20.0,14.0,28.0,9.0,15.0,0.0,21.0,31.0,20.0,26.0,22.0,28.0,0.0,25.0,8.0,15.0,21.0,18.0,24.0,0.0,21.0,23.0,24.0,25.0,4.0,0.0,1.0,40.0,19.0,36.0,16.0,13.0,2.0,20.0,25.0,18.0,6.0,32.0,10.0,25.0,5.0,20.0,13.0,25.0,19.0,12.0,19.0,28.0,10.0]},"kind":"numeric","n":50,"n_null":1,"n_unique":28,"null_rate":0.02,"stats":{"iqr":15.0,"kurtosis":-0.5336500018772776,"max":40.0,"mean":17.46938775510204,"median":19.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":10.0,"q3":25.0,"skew":-0.16155636554197175,"std":9.906020982245106,"zero_rate":0.08163265306122448}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"packaging_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"37 singleton categories"}],"column":"labels_old","extras":{"singletons":37,"top_values":[["",9],["Triman, en:Sin gluten",1],["Bezglutenowy, Triman",1],["Point Vert, Fabriqu\u00e9 en France, Ar\u00f4mes naturels, Sans colorants, Sans huile de palme, Nutriscore, Nutriscore B, 
Triman",1],["\u0421\u043f\u0440\u0430\u0432\u0435\u0434\u043b\u0438\u0432\u0430 \u0442\u044a\u0440\u0433\u043e\u0432\u0438\u044f, \u0412\u0435\u0433\u0435\u0442\u0430\u0440\u0438\u0430\u043d\u0441\u043a\u043e, \u0412\u0435\u0433\u0430\u043d, Fairtrade cocoa, FSC, FSC Mix",1],["Triman, Sans Nitrates",1],["Point Vert, Fabriqu\u00e9 en Espagne, en:CE",1],["Fair trade, Organic, Vegetarian, EU Organic, Fairtrade International, Vegan, Soil Association Organic, The Vegan Society, Commerce \u00e9quitable",1],["Point Vert, Non-bio, Triman",1],["Sans conservateurs, Fabriqu\u00e9 en France, Triman",1],["Sans gluten, V\u00e9g\u00e9tarien, Sans ar\u00f4mes artificiels, V\u00e9g\u00e9talien, Assured Food Standards, Point Vert, Sans colorants artificiels, Sans exhausteur de go\u00fbt, Sans glutamate, en:Made-in-england, en:Terracycle",1],["Organic, Vegetarian, EU Organic, Fair trade, Non-EU Agriculture, Vegan, Fairtrade International, FR-BIO-01, FSC, FSC Mix, Green Dot, Max Havelaar, PL-EKO-07, Soil Association Organic, The Vegan Society",1],["Agriculture non UE, Fabriqu\u00e9 en Belgique, Fabriqu\u00e9 en France, Sans huile de palme, Triman",1],["Organic,EU Organic,Non-EU Agriculture,Certified B Corporation,EU Agriculture,EU/non-EU Agriculture,FR-BIO-01,No palm oil,Nutriscore,Nutriscore Grade D,Pure cocoa butter,AB Agriculture Biologique",1],["Fair trade, Vegetarian, Fairtrade International, Vegan, Pure cocoa butter, Rainforest Alliance, Commerce-equitable, Pur-beurre-de-cacao",1],["Source de fibres alimentaires,Point Vert,Riche en fibres,Triman,Emballage-recyclable",1],["Halal",1],["Vegetariano,Vegano,Punto Verde",1],["Commerce \u00e9quitable, Sans gluten, Bio, V\u00e9g\u00e9tarien, \u00c9pi barr\u00e9, Bio europ\u00e9en, Kascher, V\u00e9g\u00e9talien, Point Vert, Fabriqu\u00e9 en France, Nutriscore, Nutriscore A, The Vegan Society, AB Agriculture Biologique, Afdiag",1],["Peu ou pas de sucre, Peu de sucre, Pauvre ou sans sodium, Sans conservateurs, Agriculture non UE, 
All\u00e9g\u00e9 en sucre, Riche en vitamine E, Source de fibres alimentaires, Agriculture durable, Enrichi en vitamines, Agriculture UE, Agriculture UE/Non UE, Riche en fibres, Faible teneur en sodium, Fabriqu\u00e9 en France, Ar\u00f4mes naturels, Sans colorants, Sans colorants ou conservateurs, Sans huile de palme, Nutriscore, Nutriscore A, Riche en vitamine B1, Riche en vitamine B9, Source de vitamine B6, Sans \u00e9dulcorants, Farine de bl\u00e9 fran\u00e7ais, Triman",1]]},"kind":"categorical","n":50,"n_null":4,"n_unique":38,"null_rate":0.08,"stats":{"cardinality":38,"entropy":4.9033592383835165,"entropy_ratio":0.9343420285098469,"top_rate":0.1956521739130435,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"12 singleton categories"}],"column":"packaging_text","extras":{"singletons":12,"top_values":[["",36],["1 film en plastique \u00e0 recycler\r\n1 \u00e9tui en papier ondul\u00e9 \u00e0 recycler",1],["carton, plastique",1],["1 bouchon en plastique \u00e0 trier\r\n1 bouteille en plastique \u00e0 trier",1],["1 \u00e9tui en carton \u00e0 recycler\r\n1 feuille en aluminium \u00e0 recycler",1],["1 sachet plastique \u00e0 jeter",1],["1 \u00e9tui en carton \u001f \u00e0 recycler\r\n1 feuille en aluminium \u00e0 recycler",1],["LE TRI +FACILE + BAC DE TRI",1],["4 FILMS PLASTIQUE A JETER \r\n1 \u00c9TUI CARTON \u00c0 RECYCLER",1],["cardboard (to recycle)\r\nfoil paper (to throw away)",1],["FR LE TRI + FACILE \u00c9TUI 8+ SACHETS BAC DE TRI A consommer de pr\u00e9f\u00e9rence avant le : en France par et Sant\u00e9 S.A.S. 
10:02 11914538 112 eCastelnaudary REVEL 30 04 2024",1],["Sachet, clip \u00e0 recycler",1],["2 sachets en plastique \u00e0 recycler\r\n1 bo\u00eete en carton \u00e0 recycler",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":13,"null_rate":0.04,"stats":{"cardinality":13,"entropy":1.7075187496394215,"entropy_ratio":0.4614367155526019,"top_rate":0.75,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-3.10"},{"code":"outliers","level":"warn","message":"8.0% rows beyond 1.5 IQR"}],"column":"ingredients_percent_analysis","extras":{"histogram":{"counts":[4,0,0,0,0,0,46],"edges":[-1.0,-0.7142857142857143,-0.4285714285714286,-0.1428571428571429,0.1428571428571428,0.4285714285714284,0.7142857142857142,1.0]},"sample":[1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,-1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,-1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,-1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,-1.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"iqr":0.0,"kurtosis":7.5869565217391255,"max":1.0,"mean":0.84,"median":1.0,"min":-1.0,"n_outliers":4,"outlier_rate":0.08,"q1":1.0,"q3":1.0,"skew":-3.0962810792528392,"std":0.5480950312357393,"zero_rate":0.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ecoscore_data","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"ingredients_text_sv","extras":{"singletons":4,"top_values":[["kakaomassa, kakaosm\u00f6r, fettreducerat kakaopulver, socker, vanilj.",1],["kakaomassa, fettreducerat kakaopulver, kakaosm\u00f6r, socker, emulgeringsmedel (_sojalecitin_), vaniljextrakt. Minst 85 % kakao i chokladen. 
Kan inneh\u00e5lla sp\u00e5r av n\u00f6tter och mj\u00f6lk.",1],["",1],["_VETEMJ\u00d6L_/_HVEDEMEL_, palmolja/-olie, glukossirap, maltextrakt fr\u00e5n _KORN_/_BYG_, bakpulver/h\u00e6vemidler (ammoniumkarbonater, natriumkarbonater), salt, _\u00c4GG_/_\u00c6G_/_EGG_, arom, mj\u00f6lbehandlingsmedel/melbehandlingsmiddel (_NATRIUMDISULFIT_).",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":4,"null_rate":0.92,"stats":{"cardinality":4,"entropy":2.0,"entropy_ratio":1.0,"top_rate":0.25,"top_value":"kakaomassa, kakaosm\u00f6r, fettreducerat kakaopulver, socker, vanilj."}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"brands_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"28 singleton categories"}],"column":"compared_to_category","extras":{"singletons":28,"top_values":[["en:dark-chocolate-bar-with-more-than-70-cocoa",5],["en:biscuits",4],["en:extra-fine-dark-chocolates",3],["en:dark-chocolates",3],["en:snacks-sucres",3],["en:sandwich-biscuits",2],["en:extruded-crispbreads",2],["en:plain-fermented-dairy-desserts-with-cream",1],["en:chocolate-stuffed-wafers",1],["en:spring-waters",1],["en:food",1],["en:drop-cookies",1],["en:shortbread-cookie-with-coconut",1],["en:biscuits-cookies-shelf-stable",1],["en:crispbreads",1],["fr:chips-de-pommes-de-terre-classiques",1],["en:dark-chocolate-bar",1],["en:cacao-et-derives",1],["en:crispbreads-wholemeal",1],["en:biscuit-snack-with-chocolate-filling",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":35,"null_rate":0.0,"stats":{"cardinality":35,"entropy":4.886370130156181,"entropy_ratio":0.9526419411862624,"top_rate":0.1,"top_value":"en:dark-chocolate-bar-with-more-than-70-cocoa"}},{"alerts":[{"code":"long_tail","level":"info","message":"39 singleton categories"}],"column":"data_sources","extras":{"singletons":39,"top_values":[["App - yuka, Apps, App - Open Food Facts, App 
- smoothie-openfoodfacts",4],["App - yuka, Apps, App - smoothie-openfoodfacts",3],["App - yuka, Apps, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - macrofactor",2],["App - Yuka, Apps, App - smoothie-openfoodfacts",2],["App - yuka, Apps, App - Open Food Facts, App - smoothie-openfoodfacts, App - allergytracker, App - openfoodfactsflutterapp",1],["App - yuka, Apps, App - InFood, App - Open Food Facts, App - Horizon, App - smoothie-openfoodfacts, App - halal-healthy, App - foodwasteieee, App - mon-coach-ig-bas, App - intolerapp, App - fooducate",1],["Database - FoodRepo / openfood.ch, Databases, App - yuka, Apps, App - Horizon, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - mon-coach-ig-bas, App - macrofactor, App - caloriecounterapp, App - Speisekammer",1],["App - smoothie-openfoodfacts, Apps",1],["App - yuka, Apps, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - Waistline",1],["App - elcoco, App - yuka, Apps, App - off, App - El CoCo, App - InFood, App - Open Food Facts, App - Speisekammer, App - smoothie-openfoodfacts, App - macrofactor, App - mon-coach-ig-bas, App - caloriecounterapp",1],["App - yuka, Apps, App - ethic-advisor, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, Producers, Producer - gie-sources-alma, Database - Equadis, Database - GDSN, Databases",1],["App - yuka, Apps, App - InFood, App - Open Food Facts, App - halal-healthy, App - smoothie-openfoodfacts",1],["Producer - Ferrero, Producers, App - off, App - yuka, Apps, Producer - ferrero-france-commerciale, Database - Equadis, Database - GDSN, Databases, App - Horizon, App - InFood, App - Open Food Facts, App - Speisekammer, App - smoothie-openfoodfacts, App - El CoCo, App - mon-coach-ig-bas, App - intolerapp, App - macrofactor, App - caloriecounterapp",1],["Database - FoodRepo / openfood.ch, Databases, App - yuka, Apps, App - ethic-advisor, Producers, Producer - barilla, Producer - barilla-france-sa, 
Database - Equadis, Database - GDSN, App - Open Food Facts, App - smoothie-openfoodfacts, App - mon-coach-ig-bas, App - InFood, App - caloriecounterapp",1],["Database - FoodRepo / openfood.ch, Databases, App - off, Apps, App - InFood, App - Open Food Facts, App - Yuka, App - smoothie-openfoodfacts, App - mon-coach-ig-bas, App - macrofactor",1],["Database - FoodRepo / openfood.ch, Databases, App - yuka, Apps, App - Horizon, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - macrofactor, App - Speisekammer",1],["App - yuka, Apps, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - caloriecounterapp, App - macrofactor",1],["Database - FoodRepo / openfood.ch, Databases, App - yuka, Apps, app-elcoco, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - mon-coach-ig-bas",1],["App - yuka, Apps, App - Open Food Facts, App - InFood, App - smoothie-openfoodfacts",1],["App - yuka, Apps, App - Horizon, App - InFood, App - Open Food Facts, App - smoothie-openfoodfacts, App - macrofactor, App - caloriecounterapp",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":43,"null_rate":0.0,"stats":{"cardinality":43,"entropy":5.308758439731457,"entropy_ratio":0.9783448983264562,"top_rate":0.08,"top_value":"App - yuka, Apps, App - Open Food Facts, App - smoothie-openfoodfacts"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"other_nutritional_substances_prev_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"outliers","level":"warn","message":"15.2% rows beyond 1.5 
IQR"}],"column":"ingredients_from_palm_oil_n","extras":{"histogram":{"counts":[39,0,0,0,0,7],"edges":[0.0,0.16666666666666666,0.3333333333333333,0.5,0.6666666666666666,0.8333333333333333,1.0]},"sample":[0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0]},"kind":"numeric","n":50,"n_null":4,"n_unique":2,"null_rate":0.08,"stats":{"iqr":0.0,"kurtosis":1.750915750915751,"max":1.0,"mean":0.15217391304347827,"median":0.0,"min":0.0,"n_outliers":7,"outlier_rate":0.15217391304347827,"q1":0.0,"q3":0.0,"skew":1.9367281045401676,"std":0.36315844747302034,"zero_rate":0.8478260869565217}},{"alerts":[{"code":"outliers","level":"warn","message":"12.0% rows beyond 1.5 IQR"}],"column":"last_updated_t","extras":{"histogram":{"counts":[3,1,1,2,3,8,32],"edges":[1738813895.0,1743075298.5714285,1747336702.142857,1751598105.7142856,1755859509.2857144,1760120912.857143,1764382316.4285715,1768643720.0]},"sample":[1768557199.0,1762997306.0,1768540604.0,1768504085.0,1757883911.0,1767814111.0,1761570954.0,1768001556.0,1745147085.0,1751977023.0,1767353907.0,1738845211.0,1768042908.0,1767757809.0,1759572852.0,1767705743.0,1760267634.0,1766162622.0,1761393049.0,1762240662.0,1768643720.0,1738845015.0,1764601816.0,1767819312.0,1768137111.0,1767437745.0,1768380967.0,1764429510.0,1748385396.0,1767521360.0,1767603669.0,1764175241.0,1768556517.0,1759747781.0,1767601341.0,1762163269.0,1764945307.0,1767183580.0,1767096588.0,1767515080.0,1764511895.0,1767722174.0,1766330181.0,1761737635.0,1767728546.0,1766831716.0,1768494060.0,1738813895.0,1765376778.0,1755204544.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"iqr":6137869.0,"kurtosis":2.8919560817570966,"max":1768643720.0,"mean":1762877559.6,"median":1766580948.5,"min":1738813895.0,"n_outliers":6,"outlier_rate":0.12,"q1":1761612624.25,"q3":1767750493.25,"skew":-1.94451555669091,"std":8037174.23
1112242,"zero_rate":0.0}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 98.0% of rows"}],"column":"nutrition_score_debug","extras":{"singletons":1,"top_values":[["",49],["missing saturated-fat_100g - missing sugars_100g - missing sodium_100g",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.14144054254182067,"entropy_ratio":0.14144054254182067,"top_rate":0.98,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=-2.67"},{"code":"outliers","level":"warn","message":"10.0% rows beyond 1.5 IQR"}],"column":"popularity_key","extras":{"histogram":{"counts":[5,0,0,0,0,0,45],"edges":[22999500355.0,23142427771.285713,23285355187.57143,23428282603.857143,23571210020.142857,23714137436.42857,23857064852.714287,23999992269.0]},"sample":[23999992269.0,23999951062.0,23999951057.0,23999950898.0,23999950833.0,23999950735.0,23999950733.0,23999900678.0,23999900649.0,23999900619.0,23999900611.0,23999900600.0,22999950574.0,23999900569.0,23999900563.0,23999900536.0,23999900527.0,23999900528.0,23999500514.0,23999500507.0,23999500485.0,23999500478.0,23999500459.0,23999500457.0,22999900447.0,23999500429.0,23999500421.0,23999500423.0,23999500402.0,23999500402.0,23999500398.0,22999900382.0,23999500393.0,23999500379.0,23999500372.0,23999500369.0,23999500365.0,23999500362.0,23999500364.0,23999500368.0,23999500350.0,23999500359.0,22999500356.0,22999500355.0,23999500346.0,23999500338.0,23999500336.0,23999500337.0,23999500323.0,23999500325.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":49,"null_rate":0.0,"stats":{"iqr":400207.75,"kurtosis":5.111106271503699,"max":23999992269.0,"mean":23899669332.84,"median":23999500422.0,"min":22999500355.0,"n_outliers":5,"outlier_rate":0.1,"q1":23999500359.75,"q3":23999900567.5,"skew":-2.666664777235245,"std":303018530.3565228,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"16 singleton 
categories"},{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"product_name_es","extras":{"singletons":16,"top_values":[["",4],["Pr\u00edncipe Galletas de Chocolate",1],["Excellence chocolate 90% cacao",1],["Chocolate negro 85% cacao",1],["Nutella Biscuits",1],["Biscotes integrales original",1],["Excellence 85% cacao",1],["Chocolate negro 74% cacao",1],["Tostadas crujientes de fibra",1],["Original",1],["Excellence 70% Cocoa Intense Dark",1],["Chocolate negro Ecuador 70% cacao",1],["Nutella",1],["Crunchy Oats & Honey",1],["Excellence 99% Cacao Noir Absolu",1],["Chocolate Con Leche Milka",1],["Excellence suave 70% cacao",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":17,"null_rate":0.6,"stats":{"cardinality":17,"entropy":3.9219280948873623,"entropy_ratio":0.9595018345628946,"top_rate":0.2,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"30 singleton categories"}],"column":"allergens_from_user","extras":{"singletons":30,"top_values":[["(fr) ",8],["(en) ",7],["(fr) en:gluten",3],["(en) en:soybeans, en:soybeans",2],["(en) en:banana,en:milk",1],["(en) Eggs,Gluten,Milk,Soybeans, en:milk",1],["(fr) Gluten,Lait,Soja, en:gluten",1],["(en) en:milk,en:nuts,en:soybeans",1],["(fr) Gluten,Lait",1],["(es) en:gluten,en:milk,en:nuts,en:soybeans",1],["(en) en:gluten,en:milk,en:soybeans",1],["(fr) en:gluten,en:sesame-seeds",1],["(fr) Gluten",1],["(fr) en:gluten,en:milk,en:soybeans",1],["(de) en:eggs,en:gluten,en:sulphur-dioxide-and-sulphites",1],["(en) en:gluten,en:nuts",1],["(fr) en:soybeans",1],["(en) en:milk,en:nuts,en:soybeans, en:soybeans",1],["(it) en:gluten",1],["(es) ",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":34,"null_rate":0.0,"stats":{"cardinality":34,"entropy":4.635728750643391,"entropy_ratio":0.9112064098150886,"top_rate":0.16,"top_value":"(fr) "}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"informers","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"26 singleton categories"},{"code":"null_rate","level":"warn","message":"32.0% null"}],"column":"brands_old","extras":{"singletons":26,"top_values":[["Gerbl\u00e9",3],["Lindt",3],["Green & Black's",2],["LuMondelez",1],["Lindt & spr\u00fcngli (nordic)",1],["J.D. Gross",1],["Cristaline",1],["Maruja",1],["Wasa,Barilla",1],["Tyrrell's",1],["Bjorg",1],["Fin Carr\u00e9",1],["Wasa",1],["Le pain des Fleurs,Ekibio",1],["Aperitivos company",1],["Lidl,J.D. Gross",1],["Nutella,Ferrero",1],["Pringles",1],["Nature Valley",1],["Lindt,\u0e25\u0e34\u0e19\u0e14\u0e4c",1]]},"kind":"categorical","n":50,"n_null":16,"n_unique":29,"null_rate":0.32,"stats":{"cardinality":29,"entropy":4.748940047005429,"entropy_ratio":0.9775542662205743,"top_rate":0.08823529411764706,"top_value":"Gerbl\u00e9"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_errors_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"ingredients_text","extras":{"singletons":50,"top_values":[["milk cream, cream, sugar, banana, bacteria",1],["C\u00e9r\u00e9ale 50 % (Farine de bl\u00e9 34,8 %, farine de bl\u00e9 complet 15,2 %), sucre, huiles v\u00e9g\u00e9tales (palme, colza), cacao maigre en poudre 4,5 %, sirop de glucose, amidon de bl\u00e9, poudres \u00e0 lever (carbonates d'ammonium, carbonates de sodium), \u00e9mulsifiant (l\u00e9cithines de soja), sel, lait \u00e9cr\u00e9m\u00e9 en poudre, perm\u00e9at de lactos\u00e9rum (de lait), ar\u00f4mes. 
Peut contenir \u0153uf.",1],["P\u00e2te de cacao, beurre de cacao, cacao maigre, sucre, vanille.",1],["Coffret fourr\u00e9 au cacao (41,6%) et \u00e0 la vanille (208) - Ingr\u00e9dients Farine de bl\u00e9, sucre, huile v\u00e9g\u00e9tale non hydrog\u00e9n\u00e9e (huile de palme), filtrat de lait, poudre de cacao \u00c9mulsifiant \u00e0 faible teneur en cacao (322) L\u00e9cithine de soja) Agent levant (5000) Sucre artificiel (vanilline) Sel Contient du lait, du bl\u00e9 (gluten) du soja",1],["Farine de bl\u00e9 57%, sucre de canne roux, huile de colza, s\u00e9same toast\u00e9 10,6%, germe de bl\u00e9 5,4%, farine compl\u00e8te de bl\u00e9 5,4%, ar\u00f4me naturel, magn\u00e9sium, \u00e9mulsifiant : l\u00e9cithines, poudres \u00e0 lever (tartrates de potassium, carbonates de sodium, carbonates d'ammonium), sel de mer, amidon de bl\u00e9, vitamines (E, PP, B6, B1, B9).",1],["\u041a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0437\u0430\u0445\u0430\u0440, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (\u0441\u043e\u0435\u0432\u0438), \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f, \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e,",1],["Eau de source",1],["Farine de froment, sucre, graisse v\u00e9g\u00e9tale, sucre inverti, agents levants ( bicarbonate d'ammonium - bicarbonate de sodium), sel, arome.",1],["sugar, cocoa butter, whole milk powder, cocoa mass, almonds, emulsifier (soya lecithin), flavoring",1],["cocoa mass #, cane sugar #, cocoa butter #, vanilla extract #, may contain nuts, 
milk,",1],["\u062f\u0642\u064a\u0642\u0627\u0644\u0642\u0645\u062d\u060c\u0631\u0642\u0627\u0626\u0642 \u0627\u0644\u0634\u0648\u0643\u0648\u0644\u0627\u062a\u064720%[\u0639\u062c\u064a\u0646\u0629 \u0632\u064a\u062a \u0627\u0644\u0646\u062e\u0644\u0629.\u0627\u0644\u0643\u0627\u0643\u0627\u0648\u060c\u0633\u0643\u0631\u060c\u062f\u0643\u0633\u062a\u0631\u0648\u0632 \u0648 \u0645\u0633\u062a\u062d\u0644\u0628",1],["Farine de _froment_, sucre, graisse v\u00e9g\u00e9tale, noix de coco r\u00e2p\u00e9e, poudre de _lait_, poudre de _lactos\u00e9rum_, sucre inverti, agents levants (bicarbonate d'ammonium - bicarbonate de Sodium), sel, ar\u00f4mes.",1],["P\u00e2te \u00e0 tartiner aux NOISETTES et au cacao 40% (sucre, huile de palme, NOISETTES 13%**, LAIT \u00e9cr\u00e9m\u00e9 en poudre 8,7%**, cacao maigre 7,4%**, \u00e9mulsifiants : l\u00e9cithines [SOJA]; vanilline), farine de FROMENT 32,5%, graisses v\u00e9g\u00e9tales (palme, palmiste), sucre de canne (contient BLE) 8,5%, LACTOSE, son de BLE, LAIT en poudre, miel, poudres \u00e0 lever (diphosphate disodique, carbonate acide de sodium, carbonate acide d'ammonium), farine d'ORGE malt\u00e9, cacao maigre en poudre, sel, extrait en poudre de malt d'ORGE et de ma\u00efs, amidon de FROMENT, \u00e9mulsifiants: l\u00e9cithines [SOJA]; vanilline.",1],["Farine compl\u00e8te de SEIGLE (77 g*), farine de SEIGLE (28 g*), levure, sel. Peut contenir des traces de LUPIN, LAIT, MOUTARDE, GRAINES DE S\u00c9SAME et SOJA. 
*en g pour 100 g de produit.",1],["P\u00e2te de cacao, sucre, beurre de cacao, vanille.\r\n\r\nPeut contenir des fruits \u00e0 coque, du lait, du soja et des graines de s\u00e9same.",1],["Kartoffeln, Sonnenblumen\u00f6l, Meersalz.",1],["p\u00e2te de cacao*, beurre de cacao*, cacao maigre en poudre*, sucre de canne*, extrait de vanille*, * ingr\u00e9dients issus de l'agriculture biologique",1],["P\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille",1],["Farine de bl\u00e9* 41%, Chocolat noir* 22% (p\u00e2te de cacao*, sucre de canne&quot;, beurre de cacao&quot;), Sucre de canne* roux non raffin\u00e9, Farine compl\u00e8te de bl\u00e9* 16%, Huile de tournesol ol\u00e9ique*, Ar\u00f4me naturel de vanille, Lait \u00e9cr\u00e9m\u00e9 en poudre, Sel de mer, carbonates d'ammonium, carbonates de sodium, gomme d'acacia*, extraits de romarin* Peut contenir du soja, des \u0153ufs, des fruits \u00e0 coque, des graines de s\u00e9same et de la moutarde. *Ingr\u00e9dients biologiques.",1],["cocoa mass, sugar, cocoa butter, fat reduced cocoa powder, emulsifier: lecithins (soya), natural vanilla flavouring, dark chocolate contains: cocoa solids 74% minimum,",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"milk cream, cream, sugar, banana, bacteria"}},{"alerts":[{"code":"long_tail","level":"info","message":"43 singleton categories"}],"column":"categories","extras":{"singletons":43,"top_values":[["Snacks,Snacks sucr\u00e9s,Cacao et d\u00e9riv\u00e9s,Chocolats,Chocolats noirs,Chocolat noir en tablette extra d\u00e9gustation \u00e0 70% de cacao minimum",3],["Snacks,Snacks sucr\u00e9s,Biscuits et g\u00e2teaux,Biscuits sucr\u00e9s & biscuits ap\u00e9ritifs,Biscuits",2],["Snacks,Sweet snacks,Cocoa and its products,Chocolates,Dark chocolates",2],["Dairies,Fermented foods,Fermented milk products,Snacks,Desserts,Dairy 
desserts,Fermented dairy desserts,Plain fermented dairy desserts,Plain fermented dairy desserts with cream",1],["Snacks,Breakfasts,Sweet snacks,Biscuits and cakes,Biscuits and crackers,Sandwich biscuits",1],["Snacks,Snacks sucr\u00e9s,Cacao et d\u00e9riv\u00e9s,Chocolats,Chocolats noirs,Chocolats noirs en tablette,Chocolats noirs extra fin",1],["Snacks sucr\u00e9s,Biscuits et g\u00e2teaux,Gaufrettes fourr\u00e9es au chocolat",1],["Boissons et pr\u00e9parations de boissons,Boissons,Snacks,Eaux,Eaux de sources",1],["Snacks,Snacks sucr\u00e9s,Biscuits et g\u00e2teaux,Biscuits",1],["Snacks,Sweet snacks,Cocoa and its products,Confectioneries,Chocolates,Compound chocolates,Food",1],["Snacks,Sweet snacks,Biscuits and cakes,Biscuits and crackers,Biscuits,Drop cookies",1],["Snacks,Snacks sucr\u00e9s,Biscuits et g\u00e2teaux,Biscuits,Biscuits sabl\u00e9s,Sabl\u00e9s \u00e0 la noix de coco",1],["Botanas,Snacks dulces,Galletas y pasteles,en:Biscuits and crackers,Galletas,en:Biscuits/Cookies (Shelf Stable),fr:Biscoitos recheados",1],["Aliments d'origine v\u00e9g\u00e9tale,Snacks,C\u00e9r\u00e9ales et pommes de terre,Pains,Pains croustillants,Petit-d\u00e9jeuners",1],["Produits ferment\u00e9s,Snacks,Snacks sucr\u00e9s,Cacao et d\u00e9riv\u00e9s,Chocolats,Chocolats noirs,Chocolats noirs en tablette,Chocolat noir en tablette extra d\u00e9gustation \u00e0 70% de cacao minimum",1],["Plant-based foods and beverages,Plant-based foods,Snacks,Cereals and potatoes,Salty snacks,Appetizers,Chips and fries,Crisps,Potato crisps,Potato crisps in sunflower oil,fr:Chips de pommes de terre classiques",1],["Snacks,Snacks sucr\u00e9s,Cacao et d\u00e9riv\u00e9s,Confiseries,Confiseries chocolat\u00e9es,Chocolats,Chocolats noirs",1],["Snacks,Snacks sucr\u00e9s,Cacao et d\u00e9riv\u00e9s,Chocolats,Chocolats noirs,Chocolats noirs en tablette",1],["Snacks, Sweet snacks, Biscuits and cakes, Biscuits and crackers, Biscuits, Chocolate biscuits, Filled biscuits, Dark chocolate biscuits, Sandwich 
biscuits",1],["Snacks,Sweet snacks,Cocoa and its products,Chocolates,Dark chocolates,Extra fine dark chocolates,Cacao-et-derives",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":46,"null_rate":0.0,"stats":{"cardinality":46,"entropy":5.468758439731458,"entropy_ratio":0.9900782290917441,"top_rate":0.06,"top_value":"Snacks,Snacks sucr\u00e9s,Cacao et d\u00e9riv\u00e9s,Chocolats,Chocolats noirs,Chocolat noir en tablette extra d\u00e9gustation \u00e0 70% de cacao minimum"}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+5.41"},{"code":"outliers","level":"warn","message":"15.6% rows beyond 1.5 IQR"}],"column":"nutrition_score_warning_fruits_vegetables_nuts_estimate_from_ingredients_value","extras":{"histogram":{"counts":[43,1,0,0,0,1],"edges":[0.0,16.666666666666668,33.333333333333336,50.0,66.66666666666667,83.33333333333334,100.0]},"sample":[5.0,6.80681818181818,0.0,0.0,0.0,0.0,0.0,2.67857142857143,0.0,0.0,10.6,13.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26.35,0.0,0.0,13.0,5.03571428571428,16.3,0.0,0.0,0.0,2.32575757575758,0.347222222222221,0.0,0.0,0.0,0.0,100.0,0.0,0.0,2.47916666666666,0.0,0.0]},"kind":"numeric","n":50,"n_null":5,"n_unique":13,"null_rate":0.1,"stats":{"iqr":2.32575757575758,"kurtosis":30.366197767095322,"max":100.0,"mean":4.531627785794452,"median":0.0,"min":0.0,"n_outliers":7,"outlier_rate":0.15555555555555556,"q1":0.0,"q3":2.32575757575758,"skew":5.410901776680253,"std":15.52257165055811,"zero_rate":0.7111111111111111}},{"alerts":[],"column":"ingredients_from_or_that_may_be_from_palm_oil_n","extras":{"histogram":{"counts":[33,0,0,12,0,2],"edges":[0.0,0.3333333333333333,0.6666666666666666,1.0,1.3333333333333333,1.6666666666666665,2.0]},"sample":[0.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,1.0,1.0]},"kind":"numeric","n":50,"n_null":3,"n_unique":3,"null_rate":0.06,"stats":{"iqr":1.0,"kurto
sis":0.9689904586026494,"max":2.0,"mean":0.3404255319148936,"median":0.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":1.0,"skew":1.393264559208061,"std":0.5624710908389889,"zero_rate":0.7021276595744681}},{"alerts":[{"code":"long_tail","level":"info","message":"8 singleton categories"},{"code":"null_rate","level":"warn","message":"22.0% null"}],"column":"origins_old","extras":{"singletons":8,"top_values":[["",31],["France",1],["Chambon-la-For\u00eat,France,Cairanne,Provence-Alpes-C\u00f4te d'Azur,Vaucluse,Italie,Source Sainte C\u00e9cile,Source Of\u00e9lia,Source \u00c9l\u00e9onore,Source Emma,Source \u00c9l\u00e9na",1],["United Kingdom",1],["biologique",1],["Morocco",1],["[KAKAO],Los R\u00edos (Provinz),Ecuador",1],["Farine de bl\u00e9: France",1],["Afrique de l'Ouest,Am\u00e9rique du Sud,Madagascar",1]]},"kind":"categorical","n":50,"n_null":11,"n_unique":9,"null_rate":0.22,"stats":{"cardinality":9,"entropy":1.347451305477809,"entropy_ratio":0.4250735600573263,"top_rate":0.7948717948717948,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"76.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_nl","extras":{"singletons":0,"top_values":[["",12]]},"kind":"categorical","n":50,"n_null":38,"n_unique":1,"null_rate":0.76,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"33 singleton categories"}],"column":"expiration_date","extras":{"singletons":33,"top_values":[["",15],["30days",1],["31/07/2020",1],["28/02/24",1],["30/06/2025",1],["25.11.2025",1],["12.12.2018",1],["01/2018",1],["12/06/2021",1],["19-10-2023",1],["31 jul. 2019",1],["30-04-2024",1],["11/10/2025",1],["30 jun. 
2020",1],["2024-04-01",1],["31 mai 2019",1],["31-01-2025",1],["05 2026",1],["2021-11-15",1],["31/12/2024",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":34,"null_rate":0.04,"stats":{"cardinality":34,"entropy":4.364059189593494,"entropy_ratio":0.8578065974671463,"top_rate":0.3125,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"selected_images","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"11 singleton categories"}],"column":"traces_from_ingredients","extras":{"singletons":11,"top_values":[["",39],["\u0153uf",1],["nuts, milk",1],["LUPIN, LAIT, MOUTARDE, GRAINES DE S\u00c9SAME , SOJA, LUPIN, LAIT, MOUTARDE, GRAINES DE S\u00c9SAME, SOJA",1],["fruits \u00e0 coque, lait, soja, s\u00e9same",1],["soja, \u0153ufs, fruits \u00e0 coque, s\u00e9same, moutarde",1],["LUPIN, LAIT, MOUTARDE , SOJA, LUPIN, LAIT, MOUTARDE, SOJA",1],["Schalenfr\u00fcchte, Milch, Soja",1],["LAIT, FRUITS A COQUE, LAIT, FRUITS A COQUE",1],["lait, moutarde, soja",1],[": fruits \u00e0 coque",1],["soja, s\u00e9same",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":12,"null_rate":0.0,"stats":{"cardinality":12,"entropy":1.5212424590621707,"entropy_ratio":0.4243398525803702,"top_rate":0.78,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"ingredients_text_with_allergens","extras":{"singletons":50,"top_values":[["milk cream, <span class=\"allergen\">cream</span>, sugar, <span class=\"allergen\">banana</span>, bacteria",1],["C\u00e9r\u00e9ale 50 % (Farine de <span class=\"allergen\">bl\u00e9</span> 34,8 %, farine de <span class=\"allergen\">bl\u00e9 complet</span> 15,2 %), sucre, huiles v\u00e9g\u00e9tales (palme, colza), cacao maigre en poudre 4,5 %, sirop de glucose, amidon de bl\u00e9, poudres \u00e0 lever (carbonates d'ammonium, carbonates de sodium), \u00e9mulsifiant 
(<span class=\"allergen\">l\u00e9cithines de soja</span>), sel, lait \u00e9cr\u00e9m\u00e9 en poudre, perm\u00e9at de lactos\u00e9rum (de <span class=\"allergen\">lait</span>), ar\u00f4mes. Peut contenir <span class=\"allergen\">\u0153uf</span>.",1],["P\u00e2te de cacao, beurre de cacao, cacao maigre, sucre, vanille.",1],["Coffret fourr\u00e9 au cacao (41,6%) et \u00e0 la vanille (208) - Ingr\u00e9dients Farine de bl\u00e9, sucre, huile v\u00e9g\u00e9tale non hydrog\u00e9n\u00e9e (huile de palme), filtrat de lait, poudre de cacao \u00c9mulsifiant \u00e0 faible teneur en cacao (322) <span class=\"allergen\">L\u00e9cithine de soja</span>) Agent levant (5000) Sucre artificiel (vanilline) Sel Contient du <span class=\"allergen\">lait</span>, du <span class=\"allergen\">bl\u00e9</span> (<span class=\"allergen\">gluten</span>) du <span class=\"allergen\">soja</span>",1],["Farine de <span class=\"allergen\">bl\u00e9</span> 57%, sucre de canne roux, huile de colza, s\u00e9same toast\u00e9 10,6%, germe de bl\u00e9 5,4%, farine compl\u00e8te de bl\u00e9 5,4%, ar\u00f4me naturel, magn\u00e9sium, \u00e9mulsifiant : l\u00e9cithines, poudres \u00e0 lever (tartrates de potassium, carbonates de sodium, carbonates d'ammonium), sel de mer, amidon de bl\u00e9, vitamines (E, PP, B6, B1, B9).",1],["\u041a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0437\u0430\u0445\u0430\u0440, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (<span class=\"allergen\">\u0441\u043e\u0435\u0432\u0438</span>), \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f, \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 
\u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e,",1],["Eau de source",1],["Farine de <span class=\"allergen\">froment</span>, sucre, graisse v\u00e9g\u00e9tale, sucre inverti, agents levants ( bicarbonate d'ammonium - bicarbonate de sodium), sel, arome.",1],["sugar, cocoa butter, whole milk powder, cocoa mass, <span class=\"allergen\">almonds</span>, emulsifier (<span class=\"allergen\">soya lecithin</span>), flavoring",1],["cocoa mass #, cane sugar #, cocoa butter #, vanilla extract #, may contain <span class=\"allergen\">nuts</span>, <span class=\"allergen\">milk</span>,",1],["\u062f\u0642\u064a\u0642\u0627\u0644\u0642\u0645\u062d\u060c\u0631\u0642\u0627\u0626\u0642 \u0627\u0644\u0634\u0648\u0643\u0648\u0644\u0627\u062a\u064720%[\u0639\u062c\u064a\u0646\u0629 \u0632\u064a\u062a \u0627\u0644\u0646\u062e\u0644\u0629.\u0627\u0644\u0643\u0627\u0643\u0627\u0648\u060c\u0633\u0643\u0631\u060c\u062f\u0643\u0633\u062a\u0631\u0648\u0632 \u0648 \u0645\u0633\u062a\u062d\u0644\u0628",1],["Farine de <span class=\"allergen\">froment</span>, sucre, graisse v\u00e9g\u00e9tale, noix de coco r\u00e2p\u00e9e, poudre de <span class=\"allergen\">lait</span>, poudre de <span class=\"allergen\">lactos\u00e9rum</span>, sucre inverti, agents levants (bicarbonate d'ammonium - bicarbonate de Sodium), sel, ar\u00f4mes.",1],["P\u00e2te \u00e0 tartiner aux <span class=\"allergen\">NOISETTES</span> </span>et au cacao 40% (sucre, huile de palme, <span class=\"allergen\">NOISETTES</span> </span>13%**, <span class=\"allergen\">LAIT</span> </span>\u00e9cr\u00e9m\u00e9 en poudre 8,7%**, cacao maigre 7,4%**, \u00e9mulsifiants : l\u00e9cithines [<span class=\"allergen\">SOJA</span>]; vanilline), farine de <span class=\"allergen\">FROMENT</span> </span>32,5%, graisses v\u00e9g\u00e9tales (palme, palmiste), sucre de canne (contient <span class=\"allergen\">BLE</span>) 8,5%, <span class=\"allergen\">LACTOSE</span>, son de <span 
class=\"allergen\">BLE</span>, <span class=\"allergen\">LAIT</span> </span>en poudre, miel, poudres \u00e0 lever (diphosphate disodique, carbonate acide de sodium, carbonate acide d'ammonium), farine d'<span class=\"allergen\">ORGE</span> </span>malt\u00e9, cacao maigre en poudre, sel, extrait en poudre de malt d'<span class=\"allergen\">ORGE</span> </span>et de ma\u00efs, amidon de <span class=\"allergen\">FROMENT</span>, \u00e9mulsifiants: l\u00e9cithines [<span class=\"allergen\">SOJA</span>]; vanilline.",1],["Farine compl\u00e8te de <span class=\"allergen\">SEIGLE</span> (77 g*), farine de <span class=\"allergen\">SEIGLE</span> (28 g*), levure, sel. Peut contenir des traces de <span class=\"allergen\">LUPIN</span>, <span class=\"allergen\">LAIT</span>, <span class=\"allergen\">MOUTARDE</span>, <span class=\"allergen\">GRAINES DE S\u00c9SAME</span> </span>et <span class=\"allergen\">SOJA</span>. *en g pour 100 g de produit.",1],["P\u00e2te de cacao, sucre, beurre de cacao, vanille.\r\n\r\nPeut contenir des <span class=\"allergen\">fruits \u00e0 coque</span>, du <span class=\"allergen\">lait</span>, du <span class=\"allergen\">soja</span> et des graines de <span class=\"allergen\">s\u00e9same</span>.",1],["Kartoffeln, Sonnenblumen\u00f6l, Meersalz.",1],["p\u00e2te de cacao*, beurre de cacao*, cacao maigre en poudre*, sucre de canne*, extrait de vanille*, * ingr\u00e9dients issus de l'agriculture biologique",1],["P\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille",1],["Farine de <span class=\"allergen\">bl\u00e9*</span> 41%, Chocolat noir* 22% (p\u00e2te de cacao*, sucre de canne\", beurre de cacao\"), Sucre de canne* roux non raffin\u00e9, Farine compl\u00e8te de bl\u00e9* 16%, Huile de tournesol ol\u00e9ique*, Ar\u00f4me naturel de vanille, Lait \u00e9cr\u00e9m\u00e9 en poudre, Sel de mer, carbonates d'ammonium, carbonates de sodium, gomme d'acacia*, extraits de romarin* Peut contenir du <span class=\"allergen\">soja</span>, des <span 
class=\"allergen\">\u0153ufs</span>, des <span class=\"allergen\">fruits \u00e0 coque</span>, des graines de <span class=\"allergen\">s\u00e9same</span> et de la <span class=\"allergen\">moutarde</span>. *Ingr\u00e9dients biologiques.",1],["cocoa mass, sugar, cocoa butter, fat reduced cocoa powder, emulsifier: lecithins (<span class=\"allergen\">soya</span>), natural vanilla flavouring, dark chocolate contains: cocoa solids 74% minimum,",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"milk cream, <span class=\"allergen\">cream</span>, sugar, <span class=\"allergen\">banana</span>, bacteria"}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"image_front_thumb_url","extras":{"singletons":50,"top_values":[["https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.100.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/044/9283/front_en.605.100.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/9759/front_en.492.100.jpg",1],["https://images.openfoodfacts.org/images/products/611/103/100/5064/front_fr.56.100.jpg",1],["https://images.openfoodfacts.org/images/products/317/568/001/1480/front_en.221.100.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/099/5553/front_en.314.100.jpg",1],["https://images.openfoodfacts.org/images/products/326/884/000/1008/front_fr.422.100.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1044/front_fr.50.100.jpg",1],["https://images.openfoodfacts.org/images/products/842/519/771/2024/front_en.60.100.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/057/8464/front_en.29.100.jpg",1],["https://images.openfoodfacts.org/images/products/611/125/934/3108/front_fr.25.100.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1228/front_fr.38.1
00.jpg",1],["https://images.openfoodfacts.org/images/products/800/050/031/0427/front_fr.488.100.jpg",1],["https://images.openfoodfacts.org/images/products/730/040/048/1595/front_fr.242.100.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2651/front_en.159.100.jpg",1],["https://images.openfoodfacts.org/images/products/506/004/264/1000/front_en.179.100.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/058/4724/front_en.95.100.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2606/front_en.102.100.jpg",1],["https://images.openfoodfacts.org/images/products/322/982/010/0234/front_fr.246.100.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/002/2464/front_en.301.100.jpg",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.100.jpg"}},{"alerts":[],"column":"lc","extras":{"singletons":2,"top_values":[["fr",35],["en",10],["de",3],["bg",1],["ro",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":5,"null_rate":0.0,"stats":{"cardinality":5,"entropy":1.2938747088925062,"entropy_ratio":0.557241506204038,"top_rate":0.7,"top_value":"fr"}},{"alerts":[{"code":"long_tail","level":"info","message":"34 singleton categories"},{"code":"null_rate","level":"warn","message":"28.0% null"}],"column":"ingredients_text_debug","extras":{"singletons":34,"top_values":[["",2],["Lait \u00e9cr\u00e9m\u00e9, cr\u00e9me, sucre, ferments lactiques. 
mati\u00e8re grosse 3% , sa premi\u00e8re date de publication au maroc 01/10/1993 le changement du packaging 10 ans par 10 ans depuis vingt-cinq ans de l\u2019offre",1],["C\u00e9r\u00e9ale 50,7 % (farine de bl\u00e9 35 %, farine de bl\u00e9 compl\u00e8te 15,7 %), sucre, huiles v\u00e9g\u00e9tales (palme, colza), cacao maigre en poudre 4,5 %, sirop de glucose, amidon de bl\u00e9, poudre \u00e0 lever : (carbonate acide d'ammonium, carbonate acide de sodium, diphosphate disodique), \u00e9mulsifiants : (l\u00e9cithine de soja, l\u00e9cithine de tournesol), sel, lait \u00e9cr\u00e9m\u00e9 en poudre, lactose et prot\u00e9ines de lait, ar\u00f4mes.",1],["P\u00e2te de cacao, beurre de cacao, cacao maige, sucre, vanille. Cacao: 90% minimum.",1],["Farine de bl\u00e9 55,1%, sucre de canne roux, huile de colza 14,3%, s\u00e9same toast\u00e9 11,6%, germe de bl\u00e9 5,2%, levain de seigle d\u00e9vitalis\u00e9 en poudre, fibres d'avoine, calcium, sel de mer, ar\u00f4me naturel, magn\u00e9sium, \u00e9mulsifiant :  l\u00e9cithines de colza, poudres \u00e0 lever : (tartrates de potassium, carbonates de sodium, carbonates d'ammonium), acidifiant : acide malique, prot\u00e9ines de lait, amidon de bl\u00e9, vitamines B1, B6, B9, PP et E (lactose, prot\u00e9ines de lait).",1],["Eau de source",1],["Farine de froment sucre, graisse v\u00e9g\u00e9tale ,sucre inverti, agents levants ( bicarbonate d'ammonium-bicarbonate de sodium, sel , arome. Contient du gluten Peut contenir traces de lait et soja. 
Conserver dans un endroit frais et sec",1],["Sucre, graisse v\u00e9g\u00e9tale de palmiste hydrog\u00e9n\u00e9e, _Lait_ entier en poudre, Amandes, Cacao d\u00e9graiss\u00e9 en poudre, _lactos\u00e9rum_ en poudre, \u00c9mulsifiant :  L\u00e9cithine de _soja_, Ar\u00f4mes (Vanilline).",1],["P\u00e2te \u00e0 tartiner aux _noisettes_ et au cacao 40% (sucre, huile de palme, _noisettes_ 13%, _lait_ \u00e9cr\u00e9m\u00e9 en poudre 8,7%, cacao maigre 7,4%, \u00e9mulsifiants :  l\u00e9cithines _soja_ ; vanilline), farine de _froment_ 32%, graisses v\u00e9g\u00e9tales (palme, palmiste), sucre de canne 9%, _lactose_, son de _bl\u00e9_, _lait_ en poudre, extrait en poudre de malt d'orge et de ma\u00efs, miel, poudres \u00e0 lever : (disphosfate disodique, carbonate acide d'ammonium, carbonate acide de sodium), cacao maigre, sel, amidon de _froment_, farine d'_orge_ malt\u00e9, l\u00e9cithines _soja_ ; vanilline.",1],["Farine compl\u00e8te de _seigle_, farine de _seigle_ 29%, levure, sel.",1],["P\u00e2te de cacao, sucre, beurre de cacao, vanille.",1],["Pomme de terre, huile de tournesol, sel de mer.",1],["p\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille.",1],["C\u00e9r\u00e9ales 54%(*farine de _bl\u00e9_, *farine compl\u00e8te de _bl\u00e9_ (15%)), *chocolat noir (25%) (*p\u00e2te de cacao, *sucre de canne non raffin\u00e9, *beurre de cacao), *sucre de canne roux non raffin\u00e9, *huile de tournesol ol\u00e9ique (9,7%), ar\u00f4me naturel de vanille, *_lait_ \u00e9cr\u00e9m\u00e9 en poudre, sel de mer non raffin\u00e9, poudres \u00e0 lever :  carbonates d'ammonium et de sodium, \u00e9paississant :  *gomme d'acacia, antioxydant : , *extraits de romarin.",1],["Kakaomasse*, Zucker, Kakaobutter, Kakaopulver stark ent\u00f6it, Emulgator: Sonnenblumenlecithine ( - e322 - ), nat\u00fcrliches Vanille-Aroma. 
\r\n* Rainforest Alliance Certified.\r\nKakao: 74% mindestens.",1],["en gras peuvent provoquer yne r\u00e9action chez tes personnes souffrant d'allergies d'intol\u00e9rahces alimentaires. en g pour 100g de produit. ou 4",1],["farine de froment, sucre, Graisse v\u00e9g\u00e9tale , Sucre inverti, Agents levants (Bicarbonate d'ammonium, Bicarbonate de sodium), ar\u00f4me vanille",1],["Farine de _Bl\u00e9_ 73.5 %, mati\u00e8re grasse v\u00e9g\u00e9tale,extrait de malt d'_orge_, sirop de glucose, sel, poudre \u00e0 lever : (carbonate acide d\u2019ammonium, carbonate acide de sodium), _\u0153ufs_, agent de traitement de la farine : (_sulfite_ de sodium_), ar\u00f4me",1],["Pasta de cacao, az\u00facar, manteca de cacao, vainilla Bourbon natural. (Cacao: 70% m\u00ednimo)",1],["Farine de _bl\u00e9_ 68,4%, huile de colza, sirop de sucres issu de fruits, jus concentr\u00e9 de pomme 5,3%, _noisettes_ torr\u00e9\ufb01\u00e9es 5,3%, germe de _bl\u00e9_ 5,2%, \ufb01bres de chicor\u00e9e : fructo-oligosaccharides, extrait de malt d'_orge_, ar\u00f4me naturel de pomme, \u00e9mulsi\ufb01ant :  l\u00e9cithines de colza, amidon de _bl\u00e9_, poudres \u00e0 lever : (tartrates de potassium, carbonates de potassium, carbonates d\u2018ammonium),  prot\u00e9ines de _lait_, vitamines B1, B2, B6, B9, PP et E (_lactose_, prot\u00e9ines de _lait_).",1]]},"kind":"categorical","n":50,"n_null":14,"n_unique":35,"null_rate":0.28,"stats":{"cardinality":35,"entropy":5.114369445886756,"entropy_ratio":0.9970924647735478,"top_rate":0.05555555555555555,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"62.0% 
null"}],"column":"packagings_materials_main","extras":{"singletons":1,"top_values":[["en:paper-or-cardboard",13],["en:plastic",5],["en:unknown",1]]},"kind":"categorical","n":50,"n_null":31,"n_unique":3,"null_rate":0.62,"stats":{"cardinality":3,"entropy":1.1050139971135322,"entropy_ratio":0.6971862088918521,"top_rate":0.6842105263157895,"top_value":"en:paper-or-cardboard"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_dimensions","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"32 singleton categories"}],"column":"serving_size","extras":{"singletons":32,"top_values":[["100g",3],["10 g",3],["42 g",2],["100 g",2],["30 g",2],["20g",1],["1 Square (10 g)",1],["23g",1],["11.5g",1],["25 g",1],["1 L",1],["1 portion (100 g)",1],["13,8 g",1],["11.4 g (1 tranche)",1],["1 serving (100 g)",1],["6 squares (18 g)",1],["50g",1],["20 gram",1],["10 g (1 tranche)",1],["85g",1]]},"kind":"categorical","n":50,"n_null":6,"n_unique":37,"null_rate":0.12,"stats":{"cardinality":37,"entropy":5.10693673217532,"entropy_ratio":0.9803210382628594,"top_rate":0.06818181818181818,"top_value":"100g"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"pnns_groups_1_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"}],"column":"origin","extras":{"singletons":5,"top_values":[["",42],["Fabriqu\u00e9 par: Aachen Allemagne",1],["Germe de bl\u00e9 origine ue. S\u00e9same origine non-ue.",1],["France",1],["fabriqu\u00e9 en France.pommes origine UE. noisettes origine UE et non UE",1],["Fabriqu\u00e9 en France par Nutrition et Sant\u00e9. Farine de bl\u00e9: France. 
Figues : non UE",1]]},"kind":"categorical","n":50,"n_null":3,"n_unique":6,"null_rate":0.06,"stats":{"cardinality":6,"entropy":0.7359222185561922,"entropy_ratio":0.28469357615473484,"top_rate":0.8936170212765957,"top_value":""}},{"alerts":[],"column":"ingredients_lc","extras":{"singletons":0,"top_values":[["fr",35],["en",11],["bg",2],["de",2]]},"kind":"categorical","n":50,"n_null":0,"n_unique":4,"null_rate":0.0,"stats":{"cardinality":4,"entropy":1.2122831218130428,"entropy_ratio":0.6061415609065214,"top_rate":0.7,"top_value":"fr"}},{"alerts":[{"code":"long_tail","level":"info","message":"38 singleton categories"}],"column":"packaging_old","extras":{"singletons":38,"top_values":[["Plastique",3],["",2],["Paquet, Etui en carton, Film en plastique",1],["Cardboard, Container, Packaging, Paperboard, Aluminium wrap, Caja de cart\u00f3n, Box cardboard, Card-box, Foil-wrapper, pt:Papel de aluminio",1],["Sachet, Carton, Paquet, 20 biscuits en 4 sachets",1],["Cardboard, Non-corrugated cardboard, Produkt, fr:FSC mixte, sl:PAP",1],["fr:Point vert,fr:Triman,fr:Bouteille et bouchon 100% recyclable,fr:PET,en:Bottle",1],["M\u00e9tal, Papier, en:Recyclable Metals, Aluminium",1],["Plastic, Envelope, Mixed plastic-packet",1],["Papier, Enveloppe, en:Package paper, en:Paper recycling",1],["M\u00e9tal, en:Recyclable Metals, Aluminium, Carton, Emballage carton",1],["Sachet, Sous atmosph\u00e8re protectrice, en:mixed plastic-packet",1],["Paper, Film",1],["fr:emballage carton, fr:papier aluminium",1],["Film en plastique, Film plastique \u00e0 jeter, \u00c9tui carton \u00e0 recycler",1],["fr:Plastique,fr:Sachet plastique de 3g,en:mixed plastic-packet",1],["Papier, Enveloppe",1],["Papier",1],["Plastic",1],["Container, Caja de cart\u00f3n, Aluminium-wrapper, Card-carton, pt:Papel de 
aluminio",1]]},"kind":"categorical","n":50,"n_null":7,"n_unique":40,"null_rate":0.14,"stats":{"cardinality":40,"entropy":5.26917434767504,"entropy_ratio":0.9900874746385616,"top_rate":0.06976744186046512,"top_value":"Plastique"}},{"alerts":[{"code":"long_tail","level":"info","message":"13 singleton categories"}],"column":"packaging_text_fr","extras":{"singletons":13,"top_values":[["",34],["1 film en plastique \u00e0 recycler\r\n1 \u00e9tui en papier ondul\u00e9 \u00e0 recycler",1],["carton, plastique",1],["1 bouchon en plastique \u00e0 trier\r\n1 bouteille en plastique \u00e0 trier",1],["1 \u00e9tui en carton \u00e0 recycler\r\n1 feuille en aluminium \u00e0 recycler",1],["1 sachet plastique \u00e0 jeter",1],["1 \u00e9tui en carton \u001f \u00e0 recycler\r\n1 feuille en aluminium \u00e0 recycler",1],["LE TRI +FACILE + BAC DE TRI",1],["4 FILMS PLASTIQUE A JETER \r\n1 \u00c9TUI CARTON \u00c0 RECYCLER",1],["FR LE TRI + FACILE \u00c9TUI 8+ SACHETS BAC DE TRI A consommer de pr\u00e9f\u00e9rence avant le : en France par et Sant\u00e9 S.A.S. 
10:02 11914538 112 eCastelnaudary REVEL 30 04 2024",1],["1 \u00e9tui carton \u00e0 recycler, 1 film plastique \u00e0 jeter, 1 barquette plastique \u00e0 jeter.",1],["1 FEUILLE PAPIER \u00c0 RECYCLER, 1 FEUILLE METAL \u00c0 RECYCLER, 1 FILM PLASTIQUE \u00c0 JETER",1],["Sachet, clip \u00e0 recycler",1],["2 sachets en plastique \u00e0 recycler\r\n1 bo\u00eete en carton \u00e0 recycler",1]]},"kind":"categorical","n":50,"n_null":3,"n_unique":14,"null_rate":0.06,"stats":{"cardinality":14,"entropy":1.8742965835390937,"entropy_ratio":0.49228312618834336,"top_rate":0.723404255319149,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"imbalance","level":"warn","message":"top value is 96.0% of rows"}],"column":"nova_group_debug","extras":{"singletons":2,"top_values":[["",48],["no nova group if too many ingredients are unknown: 5 out of 5",1],["no nova group if too many ingredients are unknown: 13 out of 13",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":3,"null_rate":0.0,"stats":{"cardinality":3,"entropy":0.28229218908241477,"entropy_ratio":0.17810654129291523,"top_rate":0.96,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_original_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_completeness_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"cities_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"countries_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"nutriscore_score_opposite","extras":{"histogram":{"counts":[2,2,12,13,7,5,8],"edges":[-40.0,-34.285714285714285,-28.57142857142857,-22.857142857142858,-17.142857142857142,-11.428571428571427,-5.714285714285715,0.0]},"sample":[-20.0,-14.0,-28.0,-9.0,-15.0,0.0,-21.0,-31.0,-20.0,-26.0,-22.0,-28.0,0.0,-25.0,-8.0,-15.0,-21.0,-18.0,-24.0,0.0,-21.0,-23.0,-24.0,-25.0,-4.0,0.0,-1.0,-40.0,-19.0,-36.0,-16.0,-13.0,-2.0,-20.0,-25.0,-18.0,-6.0,-32.0,-10.0,-25.0,-5.0,-20.0,-13.0,-25.0,-19.0,-12.0,-19.0,-28.0,-10.0]},"kind":"numeric","n":50,"n_null":1,"n_unique":28,"null_rate":0.02,"stats":{"iqr":15.0,"kurtosis":-0.5336500018772776,"max":0.0,"mean":-17.46938775510204,"median":-19.0,"min":-40.0,"n_outliers":0,"outlier_rate":0.0,"q1":-25.0,"q3":-10.0,"skew":0.16155636554197175,"std":9.906020982245106,"zero_rate":0.08163265306122448}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"categories_properties_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"origins_lc","extras":{"singletons":3,"top_values":[["fr",23],["en",20],["es",2],["de",1],["it",1],["pl",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":6,"null_rate":0.04,"stats":{"cardinality":6,"entropy":1.5749523572407698,"entropy_ratio":0.6092747406592504,"top_rate":0.4791666666666667,"top_value":"fr"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ciqual_food_name_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"41 singleton categories"}],"column":"countries","extras":{"singletons":41,"top_values":[["Maroc",5],["Morocco",4],["Morocco,United States",1],["Algeria,Belgium,France,French 
Polynesia,Germany,Guadeloupe,Hungary,Luxembourg,Martinique,Morocco,New Caledonia,R\u00e9union,Spain,Switzerland,United States",1],["Alg\u00e9rie,Autriche,Belgique,Bulgarie,Canada,R\u00e9publique tch\u00e8que,Finlande,France,Polyn\u00e9sie fran\u00e7aise,Allemagne,Irlande,Italie,Maurice,Maroc,Pays-Bas,Norv\u00e8ge,La R\u00e9union,Roumanie,Singapour,Espagne,Su\u00e8de,Suisse,Tunisie,Royaume-Uni",1],["Belgium, Bulgaria, France, en:switzerland",1],["Austria,Belgium,Bulgaria,Estonia,Finland,France,Germany,Italy,Lithuania,Slovakia,Slovenia,Spain,United Kingdom",1],["Belgique,C\u00f4te d'Ivoire,France,Allemagne,Luxembourg,Mali,Martinique,Russie,Suisse,Royaume-Uni",1],["Algeria,Cameroon,France,Morocco,Spain",1],["France,Irlande,Su\u00e8de,Royaume-Uni",1],["Francia,Alemania,Italia,Marruecos,Portugal,Rumania,Espa\u00f1a,Suiza",1],["France, Italy, Spain, Switzerland, en:reunion",1],["Alg\u00e9rie,Belgique,R\u00e9publique tch\u00e8que,France,Allemagne,Guadeloupe,Italie,Maroc,La R\u00e9union,Espagne,Suisse",1],["France,Germany,Spain,United Kingdom",1],["Belgium, France, United Kingdom, en:ireland",1],["Autriche,Belgique,France,Allemagne,Italie,Maroc,Pays-Bas,La R\u00e9union,Espagne,Suisse",1],["France,Luxembourg,Switzerland",1],["Belgium,Bulgaria,Czech Republic,Finland,Germany,Netherlands,Poland,Spain",1],["Belgique,France,Guadeloupe,Italie,La R\u00e9union,Espagne,Suisse",1],["\u00d6sterreich,Belgien,D\u00e4nemark,Estland,Finnland,Frankreich,Deutschland,Italien,Luxemburg,Malta,Marokko,Niederlande,Portugal,Spanien,Schweden,Schweiz",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":43,"null_rate":0.0,"stats":{"cardinality":43,"entropy":5.251663380285989,"entropy_ratio":0.9678229164426949,"top_rate":0.1,"top_value":"Maroc"}},{"alerts":[{"code":"long_tail","level":"info","message":"11 singleton categories"},{"code":"null_rate","level":"warn","message":"68.0% null"}],"column":"ingredients_text_with_allergens_it","extras":{"singletons":11,"top_values":[["",5],["Pasta di cacao, 
burro di cacao, cacao magro in polvere, zucchero. Pu\u00f2 contenere <span class=\"allergen\">nocciole</span>, <span class=\"allergen\">mandorle</span>, altra <span class=\"allergen\">frutta a guscio</span>, <span class=\"allergen\">latte</span>, <span class=\"allergen\">soia</span>.",1],["crema alle <span class=\"allergen\">NOCCIOLE</span> </span>e al cacao 40% (zucchero, olio di palma, <span class=\"allergen\">NOCCIOLE</span> </span>13%, <span class=\"allergen\">LATTE</span> </span>Scremato in polvere 8.7%, cacao magro 7,4%, emulsionanti: lecitine (<span class=\"allergen\">SOIA</span>): vanillina), farina di <span class=\"allergen\">FRUMENTO</span> (32%), grassi vegetali (palma, palmisto), zucchero di canna (9%), <span class=\"allergen\">LATTOSIO</span>, crusca di <span class=\"allergen\">FRUMENTO</span>, <span class=\"allergen\">LATTE</span> </span>intero in polvere, estratto in polvere di malto d'<span class=\"allergen\">ORZO</span> </span>e mais, miele, agenti lievitanti (difosfato disodico. carbonato acido di ammonio, carbonato acido di sodio), cacao magro, sale, amido di <span class=\"allergen\">FRUMENTO</span>, farina di <span class=\"allergen\">ORZO</span> </span>maltato, emulsionanti: lecitine (<span class=\"allergen\">SOIA</span>), vanillina.",1],["pasta di cacao, zucchero, burro di cacao, vaniglia",1],["patate, olio di girasole, sale marino.",1],["Pasta di cacao, cacao magro, burro di cacao, zucchero grezzo di canna, vaniglia.",1],["Farina integrale di <span class=\"allergen\">segale</span> (59 g), crusca di <span class=\"allergen\">grano</span> (27 g), fiocchi d'<span class=\"allergen\">avena</span> (12 g), semi di <span class=\"allergen\">sesamo</span> (7,0 g), germe di <span class=\"allergen\">grano</span>, sale. 
Pu\u00f2 contenere tracce di <span class=\"allergen\">latte</span>.",1],["Farina di <span class=\"allergen\">FRUMENTO</span>, olio di palma, sciroppo di glucosio, estratto di malto d'<span class=\"allergen\">ORZO</span>, agenti lievitanti (carbonati di ammonio, carbonati di sodio), sale, <span class=\"allergen\">UOVA</span>, aroma, agente di trattamento della farina (<span class=\"allergen\">METABISOLFITO</span> di sodio).",1],["Pasta di cacao, zucchero, burro di cacao, vaniglia.",1],["Massa di cacao, zucchero, burro di cacao, emulsionante: lecitine (<span class=\"allergen\">soia</span>); estratto di vaniglia. Pu\u00f2 contenere tracce di <span class=\"allergen\">frutta a guscio</span> e <span class=\"allergen\">latte</span>. Il 40% della massa di cacao proviene da piantagioni selezionate dell'Ecuador.",1],["wdrated potatoes, sunflower oll, <span class=\"allergen\">wheat flour</span>, corn lour.test NRC b ber otin. Emulgator (E471), Salz, Farbstoff (Annatto Norbirin, k hottom (BB). Packaged in a protective atmosphere, (DE) KNAEF Kam ef s1sel colorant (n0rbixine de rocou). Peut contenir lait, <span class=\"allergen\">soja</span>. \u00c0 conse gie vepackt. (FR) SNACK SALE. INGREDIENTS: Pommes de terre disht SNCK SALATO. : Patate disidratate, olio di girasole, (arina d frmu botisiha d annatto). Puo contenere <span class=\"allergen\">latte</span>, sola. Da consumarsi prelerbilmetp SEL NGREDIENTES: Batatas desidratadas, \u00f3leo de girasol, farinha de trigo.(aimha d mh e o, Pode conter leite, <span class=\"allergen\">soja</span>. Consumir de prefer\u00ebncia antes de: ver fundo (BB), Enbazhyer OHTS Pttas deshidratadas, aceite de qirasol, harina de trigo, harina de maiz, haia ca rm e eche, <span class=\"allergen\">soja</span>. 
Consumir preferentemente antes del: ver parte interior (8B), Enast et 'Releenc itle dn 100 g | RI\" /30g| Eectsge/Ayt acuilo medo 84U bole / Prodoth te /30g ji begja /Valor energetico Tpas (Grassi/ Unjdos / Grasas tan e\u1eadticte Fets\u00e4uren / dont 2214 kJ 664 kJ 530 kcal 159 kcal adulo medio / 8% 31g 3.0 9 9.3 0.9g 17g 13% Produoad by: see yd Aii dd cassi satui / dos quais Producido por urdes thtrde | Glucites | 5% oidrati / MedaCoyK Sabd 55g 7% Uont sucres /di eui *FRSCAME QNg",1],["25% noci, 25% mandorle, 25% uva sultanina (99,5% uva sultanina, olio di semi di girasole), 25% mirtilli rossi americani, essiccati e zuccherati (60% mirtilli rossi americani, 39% zucchero, olio di semi di girasole). Pu\u00f2 contenere tracce di altra <span class=\"allergen\">frutta a guscio</span> e <span class=\"allergen\">arachidi</span>. Confezionato in atmosfera protettiva.",1]]},"kind":"categorical","n":50,"n_null":34,"n_unique":12,"null_rate":0.68,"stats":{"cardinality":12,"entropy":3.274397470347699,"entropy_ratio":0.9133700756113953,"top_rate":0.3125,"top_value":""}},{"alerts":[],"column":"packaging_lc","extras":{"singletons":3,"top_values":[["fr",17],["en",17],["de",5],["pt",2],["it",1],["es",1],["hr",1]]},"kind":"categorical","n":50,"n_null":6,"n_unique":7,"null_rate":0.12,"stats":{"cardinality":7,"entropy":1.991627594161199,"entropy_ratio":0.7094320630828782,"top_rate":0.38636363636363635,"top_value":"fr"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"correctors_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"interface_version_created","extras":{"singletons":0,"top_values":[["20120622",29],["20150316.jqm2",18],["20130323.jqm",2]]},"kind":"categorical","n":50,"n_null":1,"n_unique":3,"null_rate":0.02,"stats":{"cardinality":3,"entropy":1.1669527240200814,"entropy_ratio":0.736265194595531,"top_rate":0.5918367346938775,"top_value":"20120622"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"states_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriscore_2021_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"stores_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton 
categories"}],"column":"image_thumb_url","extras":{"singletons":50,"top_values":[["https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.100.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/044/9283/front_en.605.100.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/9759/front_en.492.100.jpg",1],["https://images.openfoodfacts.org/images/products/611/103/100/5064/front_fr.56.100.jpg",1],["https://images.openfoodfacts.org/images/products/317/568/001/1480/front_en.221.100.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/099/5553/front_en.314.100.jpg",1],["https://images.openfoodfacts.org/images/products/326/884/000/1008/front_fr.422.100.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1044/front_fr.50.100.jpg",1],["https://images.openfoodfacts.org/images/products/842/519/771/2024/front_en.60.100.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/057/8464/front_en.29.100.jpg",1],["https://images.openfoodfacts.org/images/products/611/125/934/3108/front_fr.25.100.jpg",1],["https://images.openfoodfacts.org/images/products/336/260/001/1228/front_fr.38.100.jpg",1],["https://images.openfoodfacts.org/images/products/800/050/031/0427/front_fr.488.100.jpg",1],["https://images.openfoodfacts.org/images/products/730/040/048/1595/front_fr.242.100.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2651/front_en.159.100.jpg",1],["https://images.openfoodfacts.org/images/products/506/004/264/1000/front_en.179.100.jpg",1],["https://images.openfoodfacts.org/images/products/762/221/058/4724/front_en.95.100.jpg",1],["https://images.openfoodfacts.org/images/products/304/692/002/2606/front_en.102.100.jpg",1],["https://images.openfoodfacts.org/images/products/322/982/010/0234/front_fr.246.100.jpg",1],["https://images.openfoodfacts.org/images/products/000/002/002/2464/front_en.301.100.jpg",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate"
:0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"https://images.openfoodfacts.org/images/products/611/124/210/0992/front_fr.172.100.jpg"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"categories_properties","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nucleotides_prev_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"33 singleton categories"}],"column":"allergens_from_ingredients","extras":{"singletons":33,"top_values":[["",15],["en:gluten, froment",2],["en:milk, en:milk, cream, banana",1],["en:milk, en:milk, en:soybeans, en:gluten, en:gluten, en:gluten, bl\u00e9, bl\u00e9 complet, l\u00e9cithines de soja, lait",1],["en:milk, L\u00e9cithine de soja, lait, bl\u00e9, gluten, soja",1],["en:gluten, en:gluten, en:gluten, en:sesame-seeds, en:gluten, bl\u00e9",1],["\u0441\u043e\u0435\u0432\u0438",1],["en:soybeans, en:nuts, en:milk, almonds, soya lecithin",1],["en:milk, en:milk, en:gluten, froment, lait, lactos\u00e9rum",1],["en:soybeans, en:gluten, en:gluten, en:gluten, en:milk, en:gluten, en:gluten, en:soybeans, en:milk, en:nuts, NOISETTES , NOISETTES , LAIT , SOJA, FROMENT , BLE, LACTOSE, BLE, LAIT , ORGE , ORGE , FROMENT, SOJA, NOISETTES, NOISETTES, LAIT, SOJA, FROMENT, BLE, LACTOSE, BLE, LAIT, ORGE, ORGE, FROMENT, SOJA",1],["SEIGLE, SEIGLE, SEIGLE, SEIGLE",1],["en:milk, en:gluten, en:gluten, bl\u00e9*",1],["soya",1],["en:gluten, en:sesame-seeds, en:gluten, SEIGLE , BL\u00c9 , GRAINES DE S\u00c9SAME , BL\u00c9, SEIGLE, BL\u00c9, GRAINES DE S\u00c9SAME, BL\u00c9",1],["en:soybeans, en:soybeans, en:gluten, bl\u00e9, l\u00e9cithine de soja",1],["en:eggs, en:gluten, en:gluten, wheat  flour, 
eggs",1],["en:soybeans, en:soybeans, en:milk, en:milk, en:milk, en:gluten, Poudre de lait, L\u00e9cithine de soja",1],["en:gluten, en:gluten, en:gluten, en:nuts, en:gluten, bl\u00e9, noisettes, bl\u00e9, orge, bl\u00e9",1],["en:soybeans",1],["en:milk, en:nuts, \u041b\u0415\u0428\u041d\u0418\u0426\u0418, \u0421\u041e\u042f",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":35,"null_rate":0.0,"stats":{"cardinality":35,"entropy":4.43178901109217,"entropy_ratio":0.86401725084216,"top_rate":0.3,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"ingredients_text_with_allergens_fi","extras":{"singletons":3,"top_values":[["",2],["kaakaomassa, kaakaovoi, v\u00e4h\u00e4rasvainen kaakaojauhe, sokeri, vanilja. Saattaa sis\u00e4lt\u00e4\u00e4 <span class=\"allergen\">hasselp\u00e4hkin\u00e4\u00e4</span>, muita <span class=\"allergen\">p\u00e4hkin\u00f6it\u00e4</span>, <span class=\"allergen\">maitoa</span>, <span class=\"allergen\">soijaa</span>. Tummassa suklaassa kaakaota v\u00e4hint\u00e4\u00e4n 90%.",1],["kaakaomassa, v\u00e4h\u00e4rasvainen kaakaojauhe, kaakaovoi, sokeri, emulgointiaine (<span class=\"allergen\">soijalesitiini</span>), vaniljauute. Suklaassa kaakaota v\u00e4hint\u00e4\u00e4n 85 %. 
Saattaa sis\u00e4lt\u00e4\u00e4 pieni\u00e4 m\u00e4\u00e4ri\u00e4 <span class=\"allergen\">p\u00e4hkin\u00e4\u00e4</span> ja <span class=\"allergen\">maitoa</span>.",1],["<span class=\"allergen\">VEHN\u00c4JAUHO</span>, palmu\u00f6ljy, t\u00e4rkkelyssiirappi, <span class=\"allergen\">OHRAMALLASUUTE</span>, nostatusaineet ammoniumkarbonaatit, natriumkarbonaatit), suola, <span class=\"allergen\">KANANMUNAT</span>, aromi, jauhonparanne (<span class=\"allergen\">NATRIUMDISULFIITTI</span>).",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":4,"null_rate":0.9,"stats":{"cardinality":4,"entropy":1.9219280948873623,"entropy_ratio":0.9609640474436811,"top_rate":0.4,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"_keywords","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"16 singleton categories"}],"column":"manufacturing_places","extras":{"singletons":16,"top_values":[["",20],["France",9],["Maroc",2],["Espagne",2],["Aachen",1],["France,Italie",1],["Barilla Sverige AB,682 82,Filipstad,Zweden",1],["United Kingdom",1],["France,Oloron-sainte-marie 64400",1],["\u00dcbach-Palenberg,Heinsberg (Kreis),K\u00f6ln (Regierungsbezirk),Nordrhein-Westfalen,Deutschland",1],["Barilla Deutschland GmbH,Wasastrasze 10,29229,Celle,Allemagne",1],["Biscuits",1],["maroc",1],["Peaugres 07340",1],["Tanger,Maroc",1],["Rausch Schokoladen GmbH,Peine (Landkreis),Niedersachsen,Deutschland",1],["Revel (31250),Annoray,France",1],["Allemagne",1],["85150,Vend\u00e9e,France,Pays de la Loire,La Mothe Achard",1],["Belgique",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":20,"null_rate":0.02,"stats":{"cardinality":20,"entropy":3.186793784712595,"entropy_ratio":0.7373546516154265,"top_rate":0.40816326530612246,"top_value":""}},{"alerts":[],"column":"pnns_groups_2","extras":{"singletons":4,"top_values":[["Biscuits and cakes",17],["Chocolate 
products",16],["Appetizers",4],["Pastries",3],["Bread",2],["unknown",2],["Sweets",2],["Dairy desserts",1],["Waters and flavored waters",1],["Cereals",1],["Dried fruits",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":11,"null_rate":0.0,"stats":{"cardinality":11,"entropy":2.5990210737063397,"entropy_ratio":0.7512855752674535,"top_rate":0.34,"top_value":"Biscuits and cakes"}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"ingredients_text_pl","extras":{"singletons":2,"top_values":[["",3],["Miazga kakaowa, cukier, t\u0142uszcz kakaowy, kakao w proszku o obni\u017conej zawarto\u015bci t\u0142uszczu, emulgator: lecytyny (soja); naturalny aromat waniliowy. Czekolada gorzka: masa kakaowa minimum 74 %. Mo\u017ce zawiera\u0107 orzeszki ziemne, orzechy, mleko i gluten (pszenica, \u017cyt j\u0119czmie\u0144, owies, pszenica orkisz i pszenica khorosan).",1],["Miazga kakaowa, cukier, t\u0142uszcz kakaowy, wanilia.",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":3,"null_rate":0.9,"stats":{"cardinality":3,"entropy":1.3709505944546687,"entropy_ratio":0.8649735207179273,"top_rate":0.6,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"generic_name_es","extras":{"singletons":5,"top_values":[["",13],["Chocolate negro",2],["Chocolate negro con un 74% de cacao m\u00ednimo",1],["Crackers",1],["Tableta de chocolate negro extrafino con 70% de cacao",1],["Tableta de chocolate negro Ecuador con un 70% de cacao m\u00ednimo",1],["Chocolate Negro 99%",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":7,"null_rate":0.6,"stats":{"cardinality":7,"entropy":1.8166422780956524,"entropy_ratio":0.6471010358619617,"top_rate":0.65,"top_value":""}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.7% of 
rows"}],"column":"origin_en","extras":{"singletons":1,"top_values":[["",42],["France",1]]},"kind":"categorical","n":50,"n_null":7,"n_unique":2,"null_rate":0.14,"stats":{"cardinality":2,"entropy":0.15935006268563445,"entropy_ratio":0.15935006268563445,"top_rate":0.9767441860465116,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"68.0% null"}],"column":"generic_name_it","extras":{"singletons":3,"top_values":[["",11],["Cioccolato extra fondente",2],["Cioccolato fondente 90%",1],["Prodotto da forno con segale ricco di fibre alimentari",1],["Crackers",1]]},"kind":"categorical","n":50,"n_null":34,"n_unique":5,"null_rate":0.68,"stats":{"cardinality":5,"entropy":1.4966407621868583,"entropy_ratio":0.6445680921309758,"top_rate":0.6875,"top_value":""}},{"alerts":[{"code":"high_skew","level":"info","message":"skew=+2.23"},{"code":"outliers","level":"warn","message":"17.4% rows beyond 1.5 IQR"}],"column":"ingredients_that_may_be_from_palm_oil_n","extras":{"histogram":{"counts":[38,0,0,7,0,1],"edges":[0.0,0.3333333333333333,0.6666666666666666,1.0,1.3333333333333333,1.6666666666666665,2.0]},"sample":[0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0]},"kind":"numeric","n":50,"n_null":4,"n_unique":3,"null_rate":0.08,"stats":{"iqr":0.0,"kurtosis":4.320808304498272,"max":2.0,"mean":0.1956521739130435,"median":0.0,"min":0.0,"n_outliers":8,"outlier_rate":0.17391304347826086,"q1":0.0,"q3":0.0,"skew":2.229729868569318,"std":0.4531158898801009,"zero_rate":0.8260869565217391}},{"alerts":[{"code":"long_tail","level":"info","message":"12 singleton categories"},{"code":"null_rate","level":"warn","message":"60.0% null"}],"column":"ingredients_text_es","extras":{"singletons":12,"top_values":[["",8],["Pasta de cacao, manteca de cacao, cacao magro en polvo, az\u00facar, 
vainilla.",1],["Az\u00facar, Grasa vegetal de palmiste parcialmente hidrogenada, Leche en polvo, Almendras, Cacao desgrasado en polvo, suero l\u00e1cteo en polvo, Emulgente (lecitina de soja), aroma (vainilla).",1],["Crema de avellanas y cacao 40% (az\u00facar, manteca de palma, avellanas 13%, leche desnatada en polvo 8,7%, cacao desgrasado 7.4%, emulgentes (lecitinas (soja), vainillina), harina de trigo 32,5%, grasas vegetales (palma, palmiste), az\u00facar de ca\u00f1a 8,5% (trigo), lactosa, salvado de trigo, leche entera en polvo, extracto en polvo de malta de cebada y ma\u00edz, miel, gasificantes (difosfato dis\u00f3dico, carbonato \u00e1cido de sodio, carbonato \u00e1cido de amonio), cacao desgrasado, sal, almid\u00f3n de trigo, harina de cebada, malteada, emulsionantes (lecitinas (soja), vainillina.",1],["70% pasta de cacao*, az\u00facar, rnanteca de cacao, cacao desgrasado en polvo, emulgente: lecitlna de girasol (E-322), aroma natural de vainilla. *Pasta de cacao Ralnforest Alliance Certified cocoa. Cacao: 74% m\u00ednimo.",1],["Harina de _TRIGO_, grasa de palma, extracto de malta de _CEBADA_, gasificantes (carbonatos de amonio, carbonatos de sodio), sal, _HUEVO_, aroma, agente de tratamiento de la harina (_METABISULFITO_ s\u00f3dico).",1],["Pasta de cacao, az\u00facar, manteca de cacao, vainilla.",1],["Pasta de cacao, az\u00facar, manteca de cacao, emulgente: lecitina de girasol (E-322), extracto de vainilla. Cacao: 70% m\u00ednimo.",1],["Copos de avena integral (60%),az\u00facar, aceite refinado de girasol, miel (3%), sal, melaza de ca\u00f1a, emulgente (lecitina de girasol), gasificante (carbonato \u00e1cido de sodio),",1],["Pasta de cacao, cacao magro, manteca de cacao, az\u00facar moreno de ca\u00f1a",1],["Zucker, Kakaobutter, Magermilchpulver, Kakaomasse, Molkenpulver (Milch), Butterreinfett, Emulgator (Sojalecithin), Haselnusspaste, nat\u00fcrliches Aroma",1],["pasta de cacao, az\u00facar, manteca de cacao, emulgente (lecitina de _soja_), vainilla. 
Cacao: 70% m\u00ednimo.",1],["Pasta de cacao, cacao desgrasado en polvo, manteca de cacao, az\u00facar, leche en polvo, pasta de almendras y avellanas, emulgentes (lecitinas de soja, girasol), aroma",1]]},"kind":"categorical","n":50,"n_null":30,"n_unique":13,"null_rate":0.6,"stats":{"cardinality":13,"entropy":3.1219280948873624,"entropy_ratio":0.8436640866171592,"top_rate":0.4,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"36 singleton categories"}],"column":"teams","extras":{"singletons":36,"top_values":[["pain-au-chocolat",5],["stakano,chocolatine",3],["swipe-studio,pain-au-chocolat",2],["stakano,chocolatine,la-robe-est-bleue",1],["pain-au-chocolat,shark-attack,chocolatine,la-robe-est-bleue,stakano,dietreflux,m,b,c,swipe-studio,gmlaa,heathy-app-cross-eat,specialtiz",1],["stakano,chocolatine,swipe-studio,pain-au-chocolat",1],["chocolatine,la-robe-est-bleue,scaneco,feat,stakano,specialtiz",1],["gmlaa,pain-au-chocolat",1],["stakano,chocolatine,scaneco,gmlaa,pain-au-chocolat",1],["houda,chocolatine,la-robe-est-bleue,stakano",1],["pain-au-chocolat,specialtiz,gmlaa",1],["stakano,chocolatine,pain-au-chocolat",1],["chocolatine,la-robe-est-bleue,pain-au-chocolat,stakano",1],["pain-au-chocolat,shark-attack,swipe-studio,stakano,chocolatine,italy,feat",1],["chocolatine,la-robe-est-bleue,pain-au-chocolat,shark-attack,feat",1],["vendredi,pain-au-chocolat,stakano,chocolatine,gmlaa,italy",1],["swipe-studio,pain-au-chocolat,chocolatine,la-robe-est-bleue,gmlaa",1],["pain-au-chocolat,chocolatine,la-robe-est-bleue,vegan,specialtiz",1],["chocolatine,la-robe-est-bleue,pain-au-chocolat,feat,stakano",1],["swipe-studio,feat,bodysupport,pain-au-chocolat",1]]},"kind":"categorical","n":50,"n_null":4,"n_unique":39,"null_rate":0.08,"stats":{"cardinality":39,"entropy":5.124333087000485,"entropy_ratio":0.9695256623446842,"top_rate":0.10869565217391304,"top_value":"pain-au-chocolat"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"food_groups_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_warnings_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"main_countries_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"origins_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"packagings_complete","extras":{"histogram":{"counts":[23,0,0,0,0,25],"edges":[0.0,0.16666666666666666,0.3333333333333333,0.5,0.6666666666666666,0.8333333333333333,1.0]},"sample":[0.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0]},"kind":"numeric","n":50,"n_null":2,"n_unique":2,"null_rate":0.04,"stats":{"iqr":1.0,"kurtosis":-1.9930434782608695,"max":1.0,"mean":0.5208333333333334,"median":1.0,"min":0.0,"n_outliers":0,"outlier_rate":0.0,"q1":0.0,"q3":1.0,"skew":-0.08340576562283006,"std":0.5048523413086471,"zero_rate":0.4791666666666667}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriscore_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"8 singleton 
categories"},{"code":"null_rate","level":"warn","message":"78.0% null"}],"column":"ingredients_text_with_allergens_nl","extras":{"singletons":8,"top_values":[["",3],["Cacaomassa, cacaoboter, magere cacaopoeder, suiker.",1],["Aardappelen, zonnebloemolie, zeezout.",1],["Cacaomassa, magere cacao, cacaoboter, bruine suiker, vanille. Kan noten,<span class=\"allergen\"> melk</span>,<span class=\"allergen\"> soja</span>,<span class=\"allergen\"> sesamzaad</span> en tarwe bevatten.",1],["Cacaomassa, suiker, cacaoboter, vanille.",1],["Cacaomassa, magere cacaopoeder, cacaoboter, bruine suiker.",1],["*Referentie inname van een gemiddelde volwassehe (8400 kJ/ 2000 ReJI), 16,7 g 46x4, www,snackmindful,com Milka www,milka,com ER Mondelez France SAS, 6 avenue R\u00e9aumur, CS 50014, 92142 Clamart Cedex, Service Consommateurs N\u00ba Cristal:09,69,39,79,79 BE Mondelez Belgium, Stationsstraat 100, 2800 Mechelen, ND Mondelez Nederland, Verlengde Poolseweg 34, 4818 CL Breda, eu mondelezinternational,com e 100 g COCOA LIFE www,cocoalife,org 8 FR FRANCE ONLY 05 pp 3 045140 105502",1],["<span class=\"allergen\">tarwebloem</span> 47%, <span class=\"allergen\">melkchocolade</span> 29% (suiker, cacaomassa, cacaoboter, weipoeder (van <span class=\"allergen\">melk</span>), magere <span class=\"allergen\">melkpoeder</span>, plantaardige vetten (shea, palm in wisselende verhoudingen), <span class=\"allergen\">melkvet</span>, emulgatoren (<span class=\"allergen\">sojalecithine</span>, E476),<span class=\"allergen\"> lactose</span> (van <span class=\"allergen\">melk</span>), aroma), plantaardige oli\u00ebn (palm, kokos), suiker, suikerstroop, <span class=\"allergen\">tarwezemelen</span>, rijsmiddelen (natriumwaterstofcarbonaat, ammoniumwaterstofcarbonaat), zout, <span class=\"allergen\">tarwekiemen</span>, voedingszuur (citroenzuur)",1],["granen 98.3% (<span class=\"allergen\">volkorentarwemeel</span> 65.8%, <span class=\"allergen\">roggebloem</span>, <span class=\"allergen\">tarwebloem</span> 
10.2%, rijstbloem, gemoute <span class=\"allergen\">tarwebloem</span>, <span class=\"allergen\">tarwegriesmeel</span>, boekweitbloem, <span class=\"allergen\">gerstebloem</span>), suiker, magere <span class=\"allergen\">melkpoeder</span>, zout, palmolie, <span class=\"allergen\">tarwekiemen</span>, emulgator (zonnebloemlecithine)",1]]},"kind":"categorical","n":50,"n_null":39,"n_unique":9,"null_rate":0.78,"stats":{"cardinality":9,"entropy":3.0271691184406184,"entropy_ratio":0.9549655329584328,"top_rate":0.2727272727272727,"top_value":""}},{"alerts":[],"column":"created_t","extras":{"histogram":{"counts":[13,8,8,9,7,3,2],"edges":[1337517352.0,1392742718.2857144,1447968084.5714285,1503193450.857143,1558418817.142857,1613644183.4285715,1668869549.7142859,1724094916.0]},"sample":[1474037086.0,1443988064.0,1348995410.0,1724094916.0,1360951415.0,1556354695.0,1337517352.0,1513789538.0,1482948213.0,1550493371.0,1608169426.0,1522578754.0,1548751374.0,1436854915.0,1462636415.0,1366890201.0,1562679146.0,1462865556.0,1366110700.0,1342650111.0,1441640147.0,1518647490.0,1575320881.0,1342889958.0,1341598583.0,1612354382.0,1595696689.0,1374255877.0,1552261744.0,1342649387.0,1401619775.0,1582461760.0,1607720821.0,1379153284.0,1380743001.0,1433065227.0,1617103920.0,1424944949.0,1349035684.0,1485808955.0,1651269382.0,1693758410.0,1534511932.0,1484144730.0,1526828413.0,1477818675.0,1415119614.0,1660685390.0,1464966440.0,1415379643.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"iqr":169369262.75,"kurtosis":-0.8095226679595049,"max":1724094916.0,"mean":1483136236.02,"median":1475927880.5,"min":1337517352.0,"n_outliers":0,"outlier_rate":0.0,"q1":1385962194.5,"q3":1555331457.25,"skew":0.3311251605312739,"std":104269999.74070254,"zero_rate":0.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"traces_hierarchy","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_nb","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"15 singleton categories"},{"code":"null_rate","level":"warn","message":"66.0% null"}],"column":"ingredients_text_with_allergens_de","extras":{"singletons":15,"top_values":[["",2],["Kakaomasse, Kakaobutter, fettarmes Kakaopulver, Zucker, Vanille",1],["Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Zucker, Emulgator: Lecithine (<span class=\"allergen\">Soja</span>); Vanilleextrakt.",1],["Nuss-Nugat-Creme 40 % (Zucker, Palm\u00f6l, <span class=\"allergen\">HASELN\u00dcSSE</span> 13 %, <span class=\"allergen\">MAGERMILCHPULVER</span> 8.7%, fettarmer Kakao 7,4 %, Emulgator Lecithine (<span class=\"allergen\">SOJA</span>), Vanillin), <span class=\"allergen\">WEIZENMEHL</span> (32,5 %), pflanzliche Fette (Palm, Palmkern), Rohrzucker 8,5 % (enth\u00e4lt <span class=\"allergen\">WEIZEN</span>), <span class=\"allergen\">MILCHZUCKER</span>, <span class=\"allergen\">WEIZENKLEIE</span>, <span class=\"allergen\">VOLLMILCHPULVER</span>, <span class=\"allergen\">GERSTENMALZ</span> - und Maisextraktpulver, Honig, Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, <span class=\"allergen\">WEIZENST\u00c4RKE</span>, <span class=\"allergen\">GERSTENMALZMEHL</span>, Emulgator Lecithine (<span class=\"allergen\">SOJA</span>), Vanillin",1],["Kakaomasse, Zucker, Kakaobutter, Vanille",1],["Kartoffeln, Sonnenblumen\u00f6l, Meersalz.",1],["Kakaomasse, fettarmes 
Kakaopulver, Kakaobutter, Rohrzucker, Vanille. Kann <span class=\"allergen\">Schalenfr\u00fcchte</span>, <span class=\"allergen\">Milch</span>, <span class=\"allergen\">Soja</span>, <span class=\"allergen\">Sesamsamen</span> und <span class=\"allergen\">Weizen</span> enthalten.",1],["kakaomass of*, zucker, kakaobutter, kakaopulver stark ent\u00f6it, emulgator: sonnenblumenlecithine (e-322), nat\u00fcrliche in vanille-aroma, \r\n* rainforest alliance certified, \r\ncocoa: 74% mindestens,",1],["<span class=\"allergen\">WEIZENMEHL</span>, Palm\u00f6l, Glukosesirup, <span class=\"allergen\">GERSTENMALZEXTRAKT</span>, Backtriebmittel (Ammoniumcarbonate, Natriumcarbonate), Speisesalz 1,4 %, <span class=\"allergen\">EIER</span>, Aroma, Mehlbehandlungsmittel (<span class=\"allergen\">NATRIUMMETABISULFIT</span>).",1],["Kakaomasse, Zucker, Kakaobutter, Emulgator: Lecithine (<span class=\"allergen\">Soja</span>); Vanilleextrakt.",1],["Kartoffelp\u00fcreepulver, pflanzliche \u00d6le (Sonnenblume, Palm, Mais) in ver\u00e4nderlichen Gewichtsanteilen, <span class=\"allergen\">Weizenmehl</span>, Maismehl, Reismehl, Maltodextrin, Emulgator (E471), Salz, Farbstoff (Annatto Norbixin).",1],["Kakaomasse, fettarmes Kakaopulver, Kakaobutter . Kann <span class=\"allergen\">Schalenfr\u00fcchte</span>, <span class=\"allergen\">Milch</span> und <span class=\"allergen\">Soja</span> enthalten.",1],["Alpenmilch Schokolade.\nZutaten: Zucker, Kakaobutter, <span class=\"allergen\">Magermilchpulver</span>, Kakaomasse, <span class=\"allergen\">S\u00fc\u00dfmolkenpulver</span> (aus Milch), <span class=\"allergen\">Butterreinfett</span>, <span class=\"allergen\">Haseln\u00fcsse</span>, Emulgatoren (<span class=\"allergen\">Sojalecithin</span>, E476), Aroma. 
Kakao: 30 % mindestens.\nKann andere <span class=\"allergen\">N\u00fcsse</span> und <span class=\"allergen\">Weizen</span> enthalten.\nOhne Farbstoffe** und Konservierungsstoffe** -**Gem\u00e4\u00df rechtlicher Vorschriften.",1],["Kakaomasse\u00b9, Rohrzucker\u00b9, Kakaobutter\u00b9, Emulgator: Lecithine (<span class=\"allergen\">Soja</span>)\u00b9. \u00b9aus kontrolliert \u00f6kologischem Anbau.",1],["25% <span class=\"allergen\">Walnusskerne</span>, 25% <span class=\"allergen\">Mandeln</span>, 25% Sultaninen geschwefelt (Sultaninen, Sonnenblumen\u00f6l, Konservierungsstoff: <span class=\"allergen\">Schwefeldioxid</span>), 25% Cranberries (Cranberries, Zucker, Sonnenblumen\u00f6l).",1],["Kakaomasse, Zucker, Kakaobutter, Emulgator (<span class=\"allergen\">Sojalecithin</span>), Vanille. Kann <span class=\"allergen\">Haseln\u00fcsse</span>, <span class=\"allergen\">Mandeln</span>, <span class=\"allergen\">Milch</span> enthalten.",1]]},"kind":"categorical","n":50,"n_null":33,"n_unique":16,"null_rate":0.66,"stats":{"cardinality":16,"entropy":3.9698157824268097,"entropy_ratio":0.9924539456067024,"top_rate":0.11764705882352941,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"12 singleton categories"},{"code":"null_rate","level":"warn","message":"62.0% null"}],"column":"ingredients_text_with_allergens_es","extras":{"singletons":12,"top_values":[["",7],["Pasta de cacao, manteca de cacao, cacao magro en polvo, az\u00facar, vainilla.",1],["Az\u00facar, Grasa vegetal de palmiste parcialmente hidrogenada, Leche en polvo, <span class=\"allergen\">Almendras</span>, Cacao desgrasado en polvo, suero l\u00e1cteo en polvo, Emulgente (<span class=\"allergen\">lecitina de soja</span>), aroma (vainilla).",1],["Crema de avellanas y cacao 40% (az\u00facar, manteca de palma, <span class=\"allergen\">avellanas</span> 13%, leche desnatada en polvo 8,7%, cacao desgrasado 7.4%, emulgentes (lecitinas (<span class=\"allergen\">soja</span>), vainillina), <span 
class=\"allergen\">harina de trigo</span> 32,5%, grasas vegetales (palma, palmiste), az\u00facar de ca\u00f1a 8,5% (<span class=\"allergen\">trigo</span>), <span class=\"allergen\">lactosa</span>, salvado de trigo, leche entera en polvo, extracto en polvo de malta de cebada y ma\u00edz, miel, gasificantes (difosfato dis\u00f3dico, carbonato \u00e1cido de sodio, carbonato \u00e1cido de amonio), cacao desgrasado, sal, almid\u00f3n de trigo, harina de cebada, malteada, emulsionantes (lecitinas (<span class=\"allergen\">soja</span>), vainillina.",1],["70% pasta de cacao*, az\u00facar, rnanteca de cacao, cacao desgrasado en polvo, emulgente: lecitlna de girasol (E-322), aroma natural de vainilla. *Pasta de cacao Ralnforest Alliance Certified cocoa. Cacao: 74% m\u00ednimo.",1],["Harina de <span class=\"allergen\">TRIGO</span>, grasa de palma, extracto de malta de <span class=\"allergen\">CEBADA</span>, gasificantes (carbonatos de amonio, carbonatos de sodio), sal, <span class=\"allergen\">HUEVO</span>, aroma, agente de tratamiento de la harina (<span class=\"allergen\">METABISULFITO</span> s\u00f3dico).",1],["Pasta de cacao, az\u00facar, manteca de cacao, vainilla.",1],["Pasta de cacao, az\u00facar, manteca de cacao, emulgente: lecitina de girasol (E-322), extracto de vainilla. Cacao: 70% m\u00ednimo.",1],["Copos de avena integral (60%),az\u00facar, aceite refinado de girasol, miel (3%), sal, melaza de ca\u00f1a, emulgente (lecitina de girasol), gasificante (carbonato \u00e1cido de sodio),",1],["Pasta de cacao, cacao magro, manteca de cacao, az\u00facar moreno de ca\u00f1a",1],["Zucker, Kakaobutter, Magermilchpulver, Kakaomasse, Molkenpulver (Milch), Butterreinfett, Emulgator (Sojalecithin), Haselnusspaste, nat\u00fcrliches Aroma",1],["pasta de cacao, az\u00facar, manteca de cacao, emulgente (lecitina de <span class=\"allergen\">soja</span>), vainilla. 
Cacao: 70% m\u00ednimo.",1],["Pasta de cacao, cacao desgrasado en polvo, manteca de cacao, az\u00facar, leche en polvo, pasta de almendras y <span class=\"allergen\">avellanas</span>, emulgentes (<span class=\"allergen\">lecitinas de soja</span>, girasol), aroma",1]]},"kind":"categorical","n":50,"n_null":31,"n_unique":13,"null_rate":0.62,"stats":{"cardinality":13,"entropy":3.2136388579486774,"entropy_ratio":0.8684478339679701,"top_rate":0.3684210526315789,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"45 singleton categories"}],"column":"product_name_fr","extras":{"singletons":45,"top_values":[["Henry\u2019s",2],["Excellence Noir Subtil Doux 70% Cacao",2],["Perly",1],["Prince Go\u00fbt Chocolat",1],["Excellence Noir Prodigieux 90% Cacao",1],["Tonik",1],["S\u00e9same",1],["Chocolat noir - 85% cacao",1],["CRISTALINE Eau De Source 0.5L",1],["Maruja",1],["Dark chocolate 70%",1],["KING COOKIES",1],["Sable coco Henry s 42g",1],["Biscuits croquants au coeur onctueux de Nutella\u00ae",1],["Tartine croustillante Authentique",1],["Excellence Noir Intense 70% Cacao",1],["Lightly sea salted crisps",1],["Dark chocolate",1],["Excellence Noir Puissant 85% Cacao",1],["Fourr\u00e9s Chocolat Noir",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":47,"null_rate":0.02,"stats":{"cardinality":47,"entropy":5.533077191053984,"entropy_ratio":0.9961272271993351,"top_rate":0.04081632653061224,"top_value":"Henry\u2019s"}},{"alerts":[{"code":"long_tail","level":"info","message":"29 singleton categories"}],"column":"stores","extras":{"singletons":29,"top_values":[["",14],["Lidl",5],["Carrefour Market,Magasins U,Auchan,Intermarch\u00e9,Carrefour,Casino,Cora,Bi1,carrefour.fr,Netto,bannete,E.Leclerc",1],["Carrefour,G\u00e9ant,kupsch,Magasins U,Esselunga,Lindt,carrefour.fr,COOP,El Corte Ingl\u00e9s,Consum,Meny,Walmart",1],["E.Leclerc,Carrefour,Auchan,Monoprix,carrefour.fr,Lidl,Intermarch\u00e9",1],["Sogeres,Holyday Inn Toulon",1],["Leclerc,Magasins 
U,carrefour.fr,Intermarch\u00e9",1],["Magasins U,Carrefour,carrefour.fr,Carrefour Market,E.leclerc,Carrefour City,Intermarch\u00e9",1],["Carrefour,Magasins U,Sainsbury's,carrefour.fr,Plus,Albert Heijn,Asda,El Corte Ingl\u00e9s",1],["Tesco",1],["Magasins U,Carrefour,Auchan,carrefour.fr,E.leclerc,Carrefour Market,Carrefour City",1],["LIDL,Monoprix,Carrefour,Auchan,Intermarch\u00e9,Carrefour Market,Leclerc",1],["Dia,Auchan,Magasins U,carrefour.fr,monoprix,Centre Commercial E.Leclerc",1],["private shops,groceries,Marjane",1],["Carrefour,E.Leclerc,REWE",1],["biocoop",1],["Franprix,Magasins U,Leclerc,E Leclerc,Delhaize,carrefour.fr,Carrefour,Auchan,Carrefour Market",1],["Sainsbury's,Coop",1],["E.leclerc",1],["Franprix,Magasins U,Carrefour,carrefour.fr,Carrefour City",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":31,"null_rate":0.04,"stats":{"cardinality":31,"entropy":4.232616471903588,"entropy_ratio":0.8543497687060895,"top_rate":0.2916666666666667,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"_id","extras":{"singletons":50,"top_values":[["6111242100992",1],["7622210449283",1],["3046920029759",1],["6111031005064",1],["3175680011480",1],["20995553",1],["3268840001008",1],["3362600011044",1],["8425197712024",1],["7622210578464",1],["6111259343108",1],["3362600011228",1],["8000500310427",1],["7300400481595",1],["3046920022651",1],["5060042641000",1],["7622210584724",1],["3046920022606",1],["3229820100234",1],["20022464",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"6111242100992"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriments","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for 
kind=unknown"}],"column":"editors","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"27 singleton categories"}],"column":"max_imgid","extras":{"singletons":27,"top_values":[["47",3],["108",2],["13",2],["12",2],["6",2],["7",2],["88",2],["15",2],["82",2],["68",2],["79",2],["28",1],["235",1],["9",1],["105",1],["80",1],["158",1],["11",1],["73",1],["66",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":38,"null_rate":0.0,"stats":{"cardinality":38,"entropy":5.148758439731457,"entropy_ratio":0.9811031929350993,"top_rate":0.06,"top_value":"47"}},{"alerts":[],"column":"nutriscore_grade","extras":{"singletons":1,"top_values":[["e",27],["d",9],["c",7],["a",4],["b",2],["unknown",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":6,"null_rate":0.0,"stats":{"cardinality":6,"entropy":1.9126007492587709,"entropy_ratio":0.7398949689696431,"top_rate":0.54,"top_value":"e"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 97.8% of rows"}],"column":"product_quantity_unit","extras":{"singletons":1,"top_values":[["g",44],["ml",1]]},"kind":"categorical","n":50,"n_null":5,"n_unique":2,"null_rate":0.1,"stats":{"cardinality":2,"entropy":0.15374218032876188,"entropy_ratio":0.15374218032876188,"top_rate":0.9777777777777777,"top_value":"g"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_analysis_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"46 singleton categories"}],"column":"ingredients_text_with_allergens_fr","extras":{"singletons":46,"top_values":[["",2],["<span class=\"allergen\">Lait \u00e9cr\u00e9m\u00e9</span>, <span class=\"allergen\">cr\u00e8me</span>, SUcre, ferments laciques",1],["C\u00e9r\u00e9ale 50 % (Farine de <span class=\"allergen\">bl\u00e9</span> 34,8 %, farine de <span 
class=\"allergen\">bl\u00e9 complet</span> 15,2 %), sucre, huiles v\u00e9g\u00e9tales (palme, colza), cacao maigre en poudre 4,5 %, sirop de glucose, amidon de bl\u00e9, poudres \u00e0 lever (carbonates d'ammonium, carbonates de sodium), \u00e9mulsifiant (<span class=\"allergen\">l\u00e9cithines de soja</span>), sel, lait \u00e9cr\u00e9m\u00e9 en poudre, perm\u00e9at de lactos\u00e9rum (de <span class=\"allergen\">lait</span>), ar\u00f4mes. Peut contenir <span class=\"allergen\">\u0153uf</span>.",1],["P\u00e2te de cacao, beurre de cacao, cacao maigre, sucre, vanille.",1],["Coffret fourr\u00e9 au cacao (41,6%) et \u00e0 la vanille (208) - Ingr\u00e9dients Farine de bl\u00e9, sucre, huile v\u00e9g\u00e9tale non hydrog\u00e9n\u00e9e (huile de palme), filtrat de lait, poudre de cacao \u00c9mulsifiant \u00e0 faible teneur en cacao (322) <span class=\"allergen\">L\u00e9cithine de soja</span>) Agent levant (5000) Sucre artificiel (vanilline) Sel Contient du <span class=\"allergen\">lait</span>, du <span class=\"allergen\">bl\u00e9</span> (<span class=\"allergen\">gluten</span>) du <span class=\"allergen\">soja</span>",1],["Farine de <span class=\"allergen\">bl\u00e9</span> 57%, sucre de canne roux, huile de colza, s\u00e9same toast\u00e9 10,6%, germe de bl\u00e9 5,4%, farine compl\u00e8te de bl\u00e9 5,4%, ar\u00f4me naturel, magn\u00e9sium, \u00e9mulsifiant : l\u00e9cithines, poudres \u00e0 lever (tartrates de potassium, carbonates de sodium, carbonates d'ammonium), sel de mer, amidon de bl\u00e9, vitamines (E, PP, B6, B1, B9).",1],["P\u00e2te de cacao, cacao maigre en poudre, beurre de cacao, sucre, \u00e9mulsifiant : l\u00e9cithines (<span class=\"allergen\">soja</span>) ; extrait de vanille. 
Traces \u00e9ventuelles de <span class=\"allergen\">fruits \u00e0 coque</span> et de <span class=\"allergen\">lait</span>.",1],["Eau de source",1],["Farine de <span class=\"allergen\">froment</span>, sucre, graisse v\u00e9g\u00e9tale, sucre inverti, agents levants ( bicarbonate d'ammonium - bicarbonate de sodium), sel, arome.",1],["Sucre, graisse vegetale de palmiste hidrogen\u00e9e, Lait Enteir en poudre, <span class=\"allergen\">Amandes</span>, Cacao D\u00e9graiss\u00e9 en poudre, lactoserum en poudre, Emulsifiant L\u00e9cithine de soja, Ar\u00f4mes (Vainilline).",1],["\u062f\u0642\u064a\u0642\u0627\u0644\u0642\u0645\u062d\u060c\u0631\u0642\u0627\u0626\u0642 \u0627\u0644\u0634\u0648\u0643\u0648\u0644\u0627\u062a\u064720%[\u0639\u062c\u064a\u0646\u0629 \u0632\u064a\u062a \u0627\u0644\u0646\u062e\u0644\u0629.\u0627\u0644\u0643\u0627\u0643\u0627\u0648\u060c\u0633\u0643\u0631\u060c\u062f\u0643\u0633\u062a\u0631\u0648\u0632 \u0648 \u0645\u0633\u062a\u062d\u0644\u0628",1],["Farine de <span class=\"allergen\">froment</span>, sucre, graisse v\u00e9g\u00e9tale, noix de coco r\u00e2p\u00e9e, poudre de <span class=\"allergen\">lait</span>, poudre de <span class=\"allergen\">lactos\u00e9rum</span>, sucre inverti, agents levants (bicarbonate d'ammonium - bicarbonate de Sodium), sel, ar\u00f4mes.",1],["P\u00e2te \u00e0 tartiner aux <span class=\"allergen\">NOISETTES</span> </span>et au cacao 40% (sucre, huile de palme, <span class=\"allergen\">NOISETTES</span> </span>13%**, <span class=\"allergen\">LAIT</span> </span>\u00e9cr\u00e9m\u00e9 en poudre 8,7%**, cacao maigre 7,4%**, \u00e9mulsifiants : l\u00e9cithines [<span class=\"allergen\">SOJA</span>]; vanilline), farine de <span class=\"allergen\">FROMENT</span> </span>32,5%, graisses v\u00e9g\u00e9tales (palme, palmiste), sucre de canne (contient <span class=\"allergen\">BLE</span>) 8,5%, <span class=\"allergen\">LACTOSE</span>, son de <span class=\"allergen\">BLE</span>, <span class=\"allergen\">LAIT</span> </span>en poudre, 
miel, poudres \u00e0 lever (diphosphate disodique, carbonate acide de sodium, carbonate acide d'ammonium), farine d'<span class=\"allergen\">ORGE</span> </span>malt\u00e9, cacao maigre en poudre, sel, extrait en poudre de malt d'<span class=\"allergen\">ORGE</span> </span>et de ma\u00efs, amidon de <span class=\"allergen\">FROMENT</span>, \u00e9mulsifiants: l\u00e9cithines [<span class=\"allergen\">SOJA</span>]; vanilline.",1],["Farine compl\u00e8te de <span class=\"allergen\">SEIGLE</span> (77 g*), farine de <span class=\"allergen\">SEIGLE</span> (28 g*), levure, sel. Peut contenir des traces de <span class=\"allergen\">LUPIN</span>, <span class=\"allergen\">LAIT</span>, <span class=\"allergen\">MOUTARDE</span>, <span class=\"allergen\">GRAINES DE S\u00c9SAME</span> </span>et <span class=\"allergen\">SOJA</span>. *en g pour 100 g de produit.",1],["P\u00e2te de cacao, sucre, beurre de cacao, vanille.\r\n\r\nPeut contenir des <span class=\"allergen\">fruits \u00e0 coque</span>, du <span class=\"allergen\">lait</span>, du <span class=\"allergen\">soja</span> et des graines de <span class=\"allergen\">s\u00e9same</span>.",1],["p\u00e2te de cacao*, beurre de cacao*, cacao maigre en poudre*, sucre de canne*, extrait de vanille*, * ingr\u00e9dients issus de l'agriculture biologique",1],["P\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille",1],["Farine de <span class=\"allergen\">bl\u00e9*</span> 41%, Chocolat noir* 22% (p\u00e2te de cacao*, sucre de canne\", beurre de cacao\"), Sucre de canne* roux non raffin\u00e9, Farine compl\u00e8te de bl\u00e9* 16%, Huile de tournesol ol\u00e9ique*, Ar\u00f4me naturel de vanille, Lait \u00e9cr\u00e9m\u00e9 en poudre, Sel de mer, carbonates d'ammonium, carbonates de sodium, gomme d'acacia*, extraits de romarin* Peut contenir du <span class=\"allergen\">soja</span>, des <span class=\"allergen\">\u0153ufs</span>, des <span class=\"allergen\">fruits \u00e0 coque</span>, des graines de <span 
class=\"allergen\">s\u00e9same</span> et de la <span class=\"allergen\">moutarde</span>. *Ingr\u00e9dients biologiques.",1],["P\u00e2te de cacao, sucre, beurre de cacao, cacao maigre en poudre, \u00e9mulsifiant : l\u00e9cithines (<span class=\"allergen\">soja</span>), ar\u00f4me naturel de vanille.",1],["Farine compl\u00e8te de <span class=\"allergen\">SEIGLE</span> </span>59 g*, son de <span class=\"allergen\">BL\u00c9</span> </span>27 g*, flocons d'AVOINE 12 g*, <span class=\"allergen\">GRAINES DE S\u00c9SAME</span> </span>7,0 g*, germe de <span class=\"allergen\">BL\u00c9</span>, sel. *en g pour 100 g de produit fini. Peut contenir des traces de <span class=\"allergen\">LUPIN</span>, <span class=\"allergen\">LAIT</span>, <span class=\"allergen\">MOUTARDE</span> </span>et <span class=\"allergen\">SOJA</span>.",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":47,"null_rate":0.04,"stats":{"cardinality":47,"entropy":5.543295834054491,"entropy_ratio":0.9979669030553475,"top_rate":0.041666666666666664,"top_value":""}},{"alerts":[],"column":"interface_version_modified","extras":{"singletons":0,"top_values":[["20150316.jqm2",42],["20190830",8]]},"kind":"categorical","n":50,"n_null":0,"n_unique":2,"null_rate":0.0,"stats":{"cardinality":2,"entropy":0.6343095546405662,"entropy_ratio":0.6343095546405662,"top_rate":0.84,"top_value":"20150316.jqm2"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_sources_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"35 singleton categories"}],"column":"ingredients_text_with_allergens_en","extras":{"singletons":35,"top_values":[["",7],["milk cream, <span class=\"allergen\">cream</span>, sugar, <span class=\"allergen\">banana</span>, bacteria",1],["<span class=\"allergen\">WHEAT</span> </span>flour 35%, whole <span class=\"allergen\">WHEAT</span> </span>flour 15.7%, sugar, 
vegetable oils (palm, rapeseed), low-fat cocoa powder 4.5%, glucose syrup, <span class=\"allergen\">WHEAT</span> </span>starch, raising agents (ammonium bicarbonate, sodium bicarbonate, disodium diphosphate), emulsifiers (<span class=\"allergen\">SOY</span> </span>lecithin, sunflower lecithin), salt, skimmed <span class=\"allergen\">MILK</span> </span>powder, <span class=\"allergen\">lactose</span> and <span class=\"allergen\">MILK</span> </span>proteins, flavors, MAY CONTAIN <span class=\"allergen\">EGG</span>.",1],["cocoa mass, cocoa butter, fat reduced cocoa, sugar, vanilla",1],["<span class=\"allergen\">Wheat flour</span>, brown cane sugar, rapeseed oil, toasted sesame 10.6%, wheat germ 5.4%, whole wheat flour 5.4%, natural flavor, magnesium, emulsifier: lecithins, raising agents (potassium tartrates, sodium carbonates, ammonium carbonates), sea salt, wheat starch, vitamins (E, PP, B6, B1, B9).",1],["cocoa mass, low-fat cocoa powder, cocoa butter, sugar, emulsifier: lecithin (<span class=\"allergen\">soy</span>), vanilla extract, may contain traces of <span class=\"allergen\">nuts</span> and <span class=\"allergen\">milk</span>,",1],["Hhhhh",1],["sugar, cocoa butter, whole milk powder, cocoa mass, <span class=\"allergen\">almonds</span>, emulsifier (<span class=\"allergen\">soya lecithin</span>), flavoring",1],["cocoa mass #, cane sugar #, cocoa butter #, vanilla extract #, may contain <span class=\"allergen\">nuts</span>, <span class=\"allergen\">milk</span>,",1],["wholemeal rye flour (77 g*), <span class=\"allergen\">rye flour</span> (28 g*), yeast, salt, may contain traces of <span class=\"allergen\">milk</span> and <span class=\"allergen\">sesame seeds</span>, *in g per 100 g of product,",1],["cocoa paste, sugar, cocoa butter, vanilla,",1],["Potatoes, sunflower oil, sea salt. 
May contain <span class=\"allergen\">Milk</span>.",1],["cocoa mass, cocoa butter, fat-reduced cocoa powder, cane sugar, vanilla extract",1],["P\u00e2te de cacao, cacao maigre, beurre de cacao, cassonade, vanille bourbon naturelle en gousse.",1],["<span class=\"allergen\">Wheat</span> flour 39%, dark chocolate 25% (cocoa mass, cane sugar, cocoa butter), unrefined brown cane sugar, wholemeal <span class=\"allergen\">wheat</span> flour 15%, oleic sunflower oil, natural vanilla flavouring, skimmed <span class=\"allergen\">milk</span> powder, sea salt, raising agents: ammonium carbonates, sodium carbonates, thickener: acacia gum, antioxidant: rosemary extract.",1],["cocoa mass, sugar, cocoa butter, fat reduced cocoa powder, emulsifier: lecithins (<span class=\"allergen\">soya</span>), natural vanilla flavouring, dark chocolate contains: cocoa solids 74% minimum,",1],["whole rye flour (57 g), wheat bran (27 g), oatmeal (13 g), <span class=\"allergen\">sesame seeds</span> (7.9 g), wheat germ, salt.",1],["<span class=\"allergen\">wheat  flour</span>, palm oil, glucose syrup,  barley  malt extract, raising agents (ammonium carbonates, sodium carbonates), salt,  <span class=\"allergen\">eggs</span> , flavouring, flour treatment agent (sodium  metabisulfite ),",1],["cocoa mass, sugar, cocoa butter, vanilla,",1],["Farine de ma\u00efs* (70%), farine de riz*, sel marin. * K issus de l'agriculture biologique. 
\u2022 sans sucres ajout\u00e9s(\u00b9) (contient des sucres naturellement pr\u00e9sents.",1]]},"kind":"categorical","n":50,"n_null":8,"n_unique":36,"null_rate":0.16,"stats":{"cardinality":36,"entropy":4.92442493576916,"entropy_ratio":0.9525138052090384,"top_rate":0.16666666666666666,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"removed_countries_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"amino_acids_prev_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"50 singleton categories"}],"column":"code","extras":{"singletons":50,"top_values":[["6111242100992",1],["7622210449283",1],["3046920029759",1],["6111031005064",1],["3175680011480",1],["20995553",1],["3268840001008",1],["3362600011044",1],["8425197712024",1],["7622210578464",1],["6111259343108",1],["3362600011228",1],["8000500310427",1],["7300400481595",1],["3046920022651",1],["5060042641000",1],["7622210584724",1],["3046920022606",1],["3229820100234",1],["20022464",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":50,"null_rate":0.0,"stats":{"cardinality":50,"entropy":5.643856189774725,"entropy_ratio":1.0000000000000002,"top_rate":0.02,"top_value":"6111242100992"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"correctors","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"generic_name_ja","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"33 singleton categories"}],"column":"generic_name_fr","extras":{"singletons":33,"top_values":[["",14],["Perly fromage frais",1],["BISCUITS FOURR\u00c9S (35%) PARFUM CHOCOLAT",1],["Chocolat noir extra-fin traditionnel \u00e0 90% de cacao",1],["Biscuits au s\u00e9same",1],["Chocolat noir, 85% de cacao",1],["Eau de source",1],["Succ\u00e9dan\u00e9 de chocolat au lait avec amandes",1],["Sabl\u00e9 coco",1],["Biscuit fourr\u00e9 \u00e0 la p\u00e2te \u00e0 tartiner aux noisettes et au cacao Nutella\u00ae",1],["Pain croustillant a la farine de seigle",1],["Chocolat noir extra-fin traditionnel",1],["Chips de pommes de terre l\u00e9g\u00e8rement sal\u00e9es au sel de mer",1],["Chocolat noir extra fin, traditionnel",1],["go\u00fbters fourr\u00e9s au chocolat noir",1],["Edelbitter-Schokolade 74% Kakao",1],["Pain croustillant \u00e0 la farine compl\u00e8te de seigle, avoine et s\u00e9same.",1],["Crackers",1],["Chocolat noir extra-fin",1],["Biscuits aux pommes et aux noisettes, tr\u00e8s pauvres en sel, riches en vitamines B1, B2, B9 et E et source de vitamines PP et B6",1]]},"kind":"categorical","n":50,"n_null":3,"n_unique":34,"null_rate":0.06,"stats":{"cardinality":34,"entropy":4.420483130213672,"entropy_ratio":0.8688973793324563,"top_rate":0.2978723404255319,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"generic_name_pl","extras":{"singletons":1,"top_values":[["",4],["Wy\u015bmienita czkolada gorzka 70% 
kakao",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":2,"null_rate":0.9,"stats":{"cardinality":2,"entropy":0.7219280948873623,"entropy_ratio":0.7219280948873623,"top_rate":0.8,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"amino_acids_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_debug","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_ja","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"data_quality_info_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"last_edit_dates_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"19 singleton 
categories"}],"column":"last_modified_by","extras":{"singletons":19,"top_values":[["foodless",21],["municorn-calorie-counter-app",3],["charlesnepote",2],["macrofactor",2],["bodysupport",2],["moon-rabbit",1],["gmlaa",1],["prepperapp",1],["marmotte73",1],["laura-chaud",1],["org-barilla-france-sa",1],["tom1707",1],["bubu63",1],["moncoachigbas",1],["natrius",1],["clxtng",1],["roboto-app",1],["fgouget",1],["ludolm",1],["foodiq",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":24,"null_rate":0.02,"stats":{"cardinality":24,"entropy":3.512800591451587,"entropy_ratio":0.7661568858849049,"top_rate":0.42857142857142855,"top_value":"foodless"}},{"alerts":[{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"no_nutrition_data","extras":{"singletons":0,"top_values":[["",48]]},"kind":"categorical","n":50,"n_null":2,"n_unique":1,"null_rate":0.04,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriscore","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_nb","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"17 singleton categories"}],"column":"origins","extras":{"singletons":17,"top_values":[["",24],["France",4],["Maroc",3],["Morocco",1],["France,Union europ\u00e9enne,Non Union Europ\u00e9enne",1],["France,Provence-Alpes-C\u00f4te d'Azur,Italie,Vaucluse,en:Cairanne,en:Chambon-la-For\u00eat,en:Source Emma,en:Source Of\u00e9lia,en:Source Sainte C\u00e9cile,en:Source \u00c9l\u00e9na,en:Source 
\u00c9l\u00e9onore",1],["United Kingdom",1],["en:Madagarcar vanilla",1],["France,European Union and Non European Union",1],["Germany,Ludwig Weinrich,Ludwig Weinrich in Germany",1],["Su\u00e8de,Allemagne,Bi\u00e9lorussie,Estonie,Lettonie,Pologne,Seigle",1],["European Union and Non European Union",1],["\u00c9quateur",1],["Espa\u00f1a",1],["France,Non Union Europ\u00e9enne,Non indiqu\u00e9",1],["madagascar, fr:afrique, am\u00e9rique-du-sud",1],["fr:maroc",1],["Unspecified",1],["Farine \u0153uf France",1],["European Union",1]]},"kind":"categorical","n":50,"n_null":2,"n_unique":20,"null_rate":0.04,"stats":{"cardinality":20,"entropy":3.0267544273988385,"entropy_ratio":0.7003250310849333,"top_rate":0.5,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nova_groups_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"languages","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriscore_2023_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"packaging_materials_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"lang","extras":{"singletons":2,"top_values":[["fr",35],["en",10],["de",3],["bg",1],["ro",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":5,"null_rate":0.0,"stats":{"cardinality":5,"entropy":1.2938747088925062,"entropy_ratio":0.557241506204038,"top_rate":0.7,"top_value":"fr"}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"packaging_text_sv","extras":{"singletons":0,"top_values":[["",4]]},"kind":"categorical","n":50,"n_null":46,"n_unique":1,"null_rate":0.92,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"photographers","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"languages_codes","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[],"column":"ecoscore_grade","extras":{"singletons":2,"top_values":[["e",12],["d",9],["b",8],["c",8],["unknown",6],["a",3],["a-plus",2],["not-applicable",1],["f",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":9,"null_rate":0.0,"stats":{"cardinality":9,"entropy":2.807585439212223,"entropy_ratio":0.88569459464649,"top_rate":0.24,"top_value":"e"}},{"alerts":[],"column":"ingredients_n","extras":{"histogram":{"counts":[18,9,13,6,2,0,2],"edges":[1.0,6.428571428571429,11.857142857142858,17.285714285714285,22.714285714285715,28.142857142857146,33.57142857142857,39.0]},"sample":[5.0,19.0,5.0,16.0,22.0,7.0,1.0,9.0,8.0,4.0,5.0,12.0,34.0,4.0,4.0,3.0,5.0,5.0,14.0,9.0,6.0,8.0,17.0,12.0,4.0,20.0,3.0,22.0,5.0,6.0,8.0,14.0,12.0,14.0,3.0,7.0,25.0,20.0,10.0,17.0,21.0,13.0,5.0,9.0,6.0,16.0,39.0,12.0,26.0,14.0]},"kind":"numeric","n":50,"n_null":0,"n_unique":22,"null_rate":0.0,"stats":{"iqr":11.0,"kurtosis":1.4350606813269158,"max":39.0,"mean":11.7,"median":9.0,"min":1.0,"n_outliers":2,"outlier_rate":0.04,"q1":5.0,"q3":16.0,"skew":1.2372884444613748,"std":8.244354902301454,"zero_rate":0.0}},{"alerts":[],"column":"allergens","extras":{"singletons":7,"top_values":[["",16],["en:soybeans",5],["en:gluten",5],["en:gluten,en:milk,en:soybeans",4],["en:milk,en:nuts,en:soybeans",4],["en:gluten,en:milk",3],["en:eggs,en:gluten,en:milk,en:s
oybeans",2],["en:milk",2],["en:eggs,en:gluten,en:milk",2],["en:banana,en:milk",1],["en:gluten,en:milk,en:nuts,en:soybeans",1],["en:gluten,en:sesame-seeds",1],["en:eggs,en:gluten,en:sulphur-dioxide-and-sulphites",1],["en:gluten,en:nuts",1],["en:eggs,en:gluten",1],["en:nuts,en:sulphur-dioxide-and-sulphites",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":16,"null_rate":0.0,"stats":{"cardinality":16,"entropy":3.3643728207539825,"entropy_ratio":0.8410932051884956,"top_rate":0.32,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"minerals_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"48 singleton categories"}],"column":"product_name","extras":{"singletons":48,"top_values":[["Henry\u2019s",2],["Perly",1],["Prince Go\u00fbt Chocolat",1],["Excellence Noir Prodigieux 90% Cacao",1],["Tonik",1],["S\u00e9same",1],["\u0428\u043e\u043a\u043e\u043b\u0430\u0434 85% \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430",1],["CRISTALINE Eau De Source 0.5L",1],["",1],["Organic 70% Dark Chocolate Bar",1],["KING COOKIES",1],["Sable coco Henry s 42g",1],["Biscuits croquants au coeur onctueux de Nutella\u00ae",1],["Tartine croustillante Authentique",1],["Excellence Noir Intense 70% Cacao",1],["Lightly sea salted crisps",1],["Dark chocolate",1],["Excellence Noir Puissant 85% Cacao",1],["Fourr\u00e9s Chocolat Noir",1],["Extra dark 74% Cocoa",1]]},"kind":"categorical","n":50,"n_null":0,"n_unique":49,"null_rate":0.0,"stats":{"cardinality":49,"entropy":5.603856189774725,"entropy_ratio":0.9980669251587668,"top_rate":0.04,"top_value":"Henry\u2019s"}},{"alerts":[{"code":"long_tail","level":"info","message":"29 singleton categories"}],"column":"purchase_places","extras":{"singletons":29,"top_values":[["France",9],["",6],["Maroc",5],["Casablanca,Morocco",1],["F-77480 
Mousseaux-les-Bray,France",1],["Madrid,Espa\u00f1a,Montargis,France,W\u00fcrzburg,Deutschland,Italia,Singapore,R\u00e9publique tch\u00e8que,Toronto,Burlington,Oakville",1],["France,Lacaune",1],["Slovenija,Finland,United Kingdom",1],["Villeurbanne,France,Toulon",1],["Lund,Sweden",1],["Fez,Morocco",1],["Italien,France,Lacaune,Portugal",1],["Bar-le-Duc,France",1],["France,R\u00e9publique tch\u00e8que,Lacaune",1],["France,United Kingdom",1],["Veynes,France,Trignac",1],["Morocco",1],["France,Belgique,Espagne,Estonie",1],["Espa\u00f1a,France,Serbia,Praha,Czechia",1],["France,Normandie",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":32,"null_rate":0.02,"stats":{"cardinality":32,"entropy":4.479021262651034,"entropy_ratio":0.8958042525302068,"top_rate":0.1836734693877551,"top_value":"France"}},{"alerts":[{"code":"long_tail","level":"info","message":"28 singleton categories"}],"column":"quantity","extras":{"singletons":28,"top_values":[["100 g",6],["100g",3],["125g",2],["42g",2],["90g",2],["",2],["100 gram",2],["230 g",2],["300 g",1],["22 g",1],["230g",1],["500 ml",1],["150 g",1],["304 g",1],["275 g",1],["150g",1],["225 g",1],["85 g",1],["36 g",1],["52",1]]},"kind":"categorical","n":50,"n_null":1,"n_unique":36,"null_rate":0.02,"stats":{"cardinality":36,"entropy":4.956247343982751,"entropy_ratio":0.958669099184234,"top_rate":0.12244897959183673,"top_value":"100 g"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"traces_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_uk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"80.0% null"}],"column":"generic_name_ar","extras":{"singletons":1,"top_values":[["",9],["\u0627\u0644\u0627\u0645\u064a\u0631",1]]},"kind":"categorical","n":50,"n_null":40,"n_unique":2,"null_rate":0.8,"stats":{"cardinality":2,"entropy":0.4689955935892812,"entropy_ratio":0.4689955935892812,"top_rate":0.9,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_uk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"78.0% null"}],"column":"ingredients_text_ar","extras":{"singletons":1,"top_values":[["",10],["\u0633\u0643\u0631\u060c\u062f\u0642\u064a\u0642\u060c\u062f\u0647\u0648\u0646 \u0646\u0628\u0627\u062a\u064a\u0629 (\u0646\u062e\u064a\u0644\u060c\u0634\u064a\u0627)\u060c\u0645\u0633\u062d\u0648\u0642 \u0643\u0627\u0643\u0627\u0648\u060c\u0634\u0631\u0627\u0628 \u062c\u0644\u0648\u0643\u0648\u0632\u060c\u0646\u0634\u0627 \u0627\u0644\u0630\u0631\u0629\u060c\u0645\u0633\u062d\u0648\u0642 \u062d\u0644\u064a\u0628\u060c\u0645\u0633\u062d\u0648\u0642 \u0645\u0635\u0644 \u0627\u0644\u0644\u0628\u0646\u060c\u0645\u0633\u062d\u0648\u0642 \u062d\u0644\u064a\u0628 \u0643\u0627\u0645\u0644 \u0627\u0644\u062f\u0633\u0645\u060c\u0639\u062c\u064a\u0646\u0629 \u0627\u0644\u0643\u0627\u0643\u0627\u0648\u060c\u0645\u0648\u0627\u062f 
\u0631\u0627\u0641\u0639\u0629(\u0628\u0643\u0631\u0628\u0648\u0646\u0627\u062a \u0627\u0644\u0635\u0648\u062f\u064a\u0648\u0645 \u0648 \u0627\u0644\u0623\u0645\u0648\u0646\u064a\u0648\u0645)\u060c\u0645\u0644\u062d\u060c\u0645\u0633\u062a\u062d\u0644\u0628(\u0644\u0633\u064a\u062a\u064a\u0646 \u0627\u0644\u0635\u0648\u064a\u0627(E322)\u0648\u06a4\u0627\u0646\u064a\u0644\u064a\u0646",1]]},"kind":"categorical","n":50,"n_null":39,"n_unique":2,"null_rate":0.78,"stats":{"cardinality":2,"entropy":0.4394969869215134,"entropy_ratio":0.4394969869215134,"top_rate":0.9090909090909091,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_uk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"last_check_dates_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"86.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"checked","extras":{"singletons":0,"top_values":[["on",7]]},"kind":"categorical","n":50,"n_null":43,"n_unique":1,"null_rate":0.86,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"on"}},{"alerts":[{"code":"null_rate","level":"warn","message":"80.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"packaging_text_ar","extras":{"singletons":0,"top_values":[["",10]]},"kind":"categorical","n":50,"n_null":40,"n_unique":1,"null_rate":0.8,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"62.0% null"}],"column":"carbon_footprint_percent_of_known_ingredients","extras":{"histogram":{"counts":[3,2,3,8,3],"edges":[8.0,27.4,46.8,66.19999999999999,85.6,105.0]},"sample":[50.0,55.1,85.0,41.0,105.0,79.0,98.0,18.4,30.0,73.7,70.0,13.0,77.6,52.0,69.0,75.0,8.0,76.0,98.3]},"kind":"numeric","n":50,"n_null":31,"n_unique":19,"null_rate":0.62,"stats":{"iqr":32.8,"kurtosis":-0.8082846077355375,"max":105.0,"mean":61.79473684210526,"median":70.0,"min":8.0,"n_outliers":0,"outlier_rate":0.0,"q1":45.5,"q3":78.3,"skew":-0.4493067182896219,"std":28.975765231659263,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"last_checker","extras":{"singletons":2,"top_values":[["aleene",3],["moon-rabbit",2],["beniben",1],["sebleouf",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":4,"null_rate":0.86,"stats":{"cardinality":4,"entropy":1.8423709931771088,"entropy_ratio":0.9211854965885544,"top_rate":0.42857142857142855,"top_value":"aleene"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_uk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"generic_name_uk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"78.0% null"}],"column":"product_name_ar","extras":{"singletons":5,"top_values":[["",6],["\u0628\u0631\u0646\u0633",1],["Tonjik",1],["Leche Y Almendras",1],["Eyoo cover",1],["Chocolate Negro 92% Cacao",1]]},"kind":"categorical","n":50,"n_null":39,"n_unique":6,"null_rate":0.78,"stats":{"cardinality":6,"entropy":2.049452072789394,"entropy_ratio":0.7928362876512272,"top_rate":0.5454545454545454,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"14 singleton categories"},{"code":"null_rate","level":"warn","message":"72.0% null"}],"column":"carbon_footprint_from_known_ingredients_debug","extras":{"singletons":14,"top_values":[["en:cereal 50% x 0.3 = 15 g - ",1],["en:wheat-flour 55.1% x 1.2 = 66.12 g - ",1],["en:wheat-flour 32% x 1.2 = 38.4 g - en:cane-sugar 9% x 1.3 = 11.7 g - ",1],["en:wholemeal-rye-flour 77% x 1.2 = 92.4 g - en:rye-flour 28% x 1.2 = 33.6 g - ",1],["en:wheat-flour 39% x 1.2 = 46.8 g - en:dark-chocolate 25% x 4.9 = 122.5 g - en:whole-wheat-flour 15% x 1.2 = 18 g - ",1],["en:wholemeal-rye-flour 59% x 1.2 = 70.8 g - en:wheat-bran 27% x 0.6 = 16.2 g - en:oat-flakes 12% x 0.3 = 3.6 g - ",1],["en:wheat-flour 68.5% x 1.2 = 82.2 g - en:wheat-germ 5.2% x 0.6 = 3.12 g - ",1],["en:hazelnut-oil 13% x 2.6 = 33.8 g - ",1],["en:whole-wheat-flour 26.5% x 1.2 = 31.8 g - en:wheat-flour 26.1% x 1.2 = 31.32 g - en:wheat-bran 19.9% x 0.6 = 11.94 g - en:fig-paste 5.1% x 0.3 = 1.53 g - ",1],["en:wheat-flour 41% x 1.2 = 49.2 g - en:fresh-egg 11% x 2.6 = 28.6 g - ",1],["en:walnut-kernel 25% x 1.3 = 32.5 g - en:almond 25% x 5.9 = 147.5 g - en:cranberry 25% x 0.3 = 7.5 g - 
",1],["en:whole-fresh-eggs 8% x 2.6 = 20.8 g - ",1],["en:wheat-flour 37% x 1.2 = 44.4 g - en:milk-chocolate 27% x 5.9 = 159.3 g - en:whole-wheat-flour 12% x 1.2 = 14.4 g - ",1],["en:cereal 98.3% x 0.3 = 29.49 g - ",1]]},"kind":"categorical","n":50,"n_null":36,"n_unique":14,"null_rate":0.72,"stats":{"cardinality":14,"entropy":3.8073549220576055,"entropy_ratio":1.0000000000000004,"top_rate":0.07142857142857142,"top_value":"en:cereal 50% x 0.3 = 15 g - "}},{"alerts":[{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"last_checked_t","extras":{"histogram":{"counts":[4,1,0,0,2],"edges":[1540933974.0,1578792448.0,1616650922.0,1654509396.0,1692367870.0,1730226344.0]},"sample":[1540933974.0,1730226344.0,1599127602.0,1564679969.0,1704302843.0,1548146220.0,1563262266.0]},"kind":"numeric","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"iqr":96010979.5,"kurtosis":-1.1027328950074335,"max":1730226344.0,"mean":1607239888.2857144,"median":1564679969.0,"min":1540933974.0,"n_outliers":0,"outlier_rate":0.0,"q1":1555704243.0,"q3":1651715222.5,"skew":0.810558812923924,"std":77724522.67254399,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_uk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"82.0% null"}],"column":"ingredients_text_with_allergens_ar","extras":{"singletons":1,"top_values":[["",8],["\u0633\u0643\u0631\u060c\u062f\u0642\u064a\u0642\u060c\u062f\u0647\u0648\u0646 \u0646\u0628\u0627\u062a\u064a\u0629 (\u0646\u062e\u064a\u0644\u060c\u0634\u064a\u0627)\u060c\u0645\u0633\u062d\u0648\u0642 
\u0643\u0627\u0643\u0627\u0648\u060c\u0634\u0631\u0627\u0628 \u062c\u0644\u0648\u0643\u0648\u0632\u060c\u0646\u0634\u0627 \u0627\u0644\u0630\u0631\u0629\u060c\u0645\u0633\u062d\u0648\u0642 \u062d\u0644\u064a\u0628\u060c\u0645\u0633\u062d\u0648\u0642 \u0645\u0635\u0644 \u0627\u0644\u0644\u0628\u0646\u060c\u0645\u0633\u062d\u0648\u0642 \u062d\u0644\u064a\u0628 \u0643\u0627\u0645\u0644 \u0627\u0644\u062f\u0633\u0645\u060c\u0639\u062c\u064a\u0646\u0629 \u0627\u0644\u0643\u0627\u0643\u0627\u0648\u060c\u0645\u0648\u0627\u062f \u0631\u0627\u0641\u0639\u0629(\u0628\u0643\u0631\u0628\u0648\u0646\u0627\u062a \u0627\u0644\u0635\u0648\u062f\u064a\u0648\u0645 \u0648 \u0627\u0644\u0623\u0645\u0648\u0646\u064a\u0648\u0645)\u060c\u0645\u0644\u062d\u060c\u0645\u0633\u062a\u062d\u0644\u0628(\u0644\u0633\u064a\u062a\u064a\u0646 \u0627\u0644\u0635\u0648\u064a\u0627(E322)\u0648\u06a4\u0627\u0646\u064a\u0644\u064a\u0646",1]]},"kind":"categorical","n":50,"n_null":41,"n_unique":2,"null_rate":0.82,"stats":{"cardinality":2,"entropy":0.5032583347756457,"entropy_ratio":0.5032583347756457,"top_rate":0.8888888888888888,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"80.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_ar","extras":{"singletons":0,"top_values":[["",10]]},"kind":"categorical","n":50,"n_null":40,"n_unique":1,"null_rate":0.8,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"nutriments_estimated","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"70.0% null"},{"code":"constant","level":"info","message":"only one distinct 
value"}],"column":"nutrition_score_warning_no_fiber","extras":{"histogram":{"counts":[0,0,15,0,0],"edges":[0.5,0.7,0.9,1.1,1.3,1.5]},"sample":[1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0]},"kind":"numeric","n":50,"n_null":35,"n_unique":1,"null_rate":0.7,"stats":{"iqr":0.0,"kurtosis":0.0,"max":1.0,"mean":1.0,"median":1.0,"min":1.0,"n_outliers":0,"outlier_rate":0.0,"q1":1.0,"q3":1.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_text_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"taxonomies_enhancer_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"68.0% null"}],"column":"completed_t","extras":{"histogram":{"counts":[1,5,4,1,5],"edges":[1628199203.0,1655198448.6,1682197694.2,1709196939.8,1736196185.4,1763195431.0]},"sample":[1686752676.0,1667313786.0,1663425082.0,1717001935.0,1740146101.0,1763195431.0,1706704378.0,1659852565.0,1757100827.0,1628199203.0,1741976102.0,1699482126.0,1739311856.0,1663104260.0,1707990172.0,1660410134.0]},"kind":"numeric","n":50,"n_null":34,"n_unique":16,"null_rate":0.68,"stats":{"iqr":76175540.75,"kurtosis":-1.1548795045758524,"max":1763195431.0,"mean":1700122914.625,"median":1703093252.0,"min":1628199203.0,"n_outliers":0,"outlier_rate":0.0,"q1":1663344876.5,"q3":1739520417.25,"skew":0.001246782415800225,"std":40701027.20630235,"zero_rate":0.0}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"product_name_bg","extras":{"singletons":3,"top_values":[["\u0428\u043e\u043a\u043e\u043b\u0430\u0434 85% \u043a\u0430\u043a\u0430\u043e\u0432\u0430 
\u043c\u0430\u0441\u0430",1],["\u0422\u044a\u043c\u0435\u043d \u0448\u043e\u043a\u043e\u043b\u0430\u0434 74% \u043a\u0430\u043a\u0430\u043e",1],["\u041b\u0435\u0448\u043d\u0438\u043a\u043e\u0432\u043e-\u043a\u0430\u043a\u0430\u043e\u0432 \u043a\u0440\u0435\u043c",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"\u0428\u043e\u043a\u043e\u043b\u0430\u0434 85% \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"ingredients_text_et","extras":{"singletons":3,"top_values":[["kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (_sojin_ lecitin); ekstrakt vanilije.",1],["Kakaomasse*, Zucker, Kakaobutter, Kakaopulver stark ent\u00f6it, Emulgator: Sonnenblumenlecithine (E-322), nat\u00fcrliches Vanille-Aroma, \r\n* Rainforest Alliance Certified,\r\nKakao: 74% mindestens,",1],["Kakaomass, suhkur, kakaovoi, vanill.",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (_sojin_ lecitin); ekstrakt vanilije."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_sl","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton 
categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_dz","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_sl","extras":{"singletons":1,"top_values":[["Kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (sojin lecitin); ekstrakt vanilije. Lahko vsebuje sledi ore\u0161kov (le\u0161niki, mandlji, pistacija) in mleka. Uporabno najmanj do: glej odtis na zadnji strani embala\u017ee.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (sojin lecitin); ekstrakt vanilije. Lahko vsebuje sledi ore\u0161kov (le\u0161niki, mandlji, pistacija) in mleka. 
Uporabno najmanj do: glej odtis na zadnji strani embala\u017ee."}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_ca","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_dz","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_ca","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_ca","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"product_name_et","extras":{"singletons":3,"top_values":[["Chocolat noir - 85% cacao",1],["",1],["Excellence 70% Cocoa Intense 
Dark",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"Chocolat noir - 85% cacao"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"ingredients_text_with_allergens_bg","extras":{"singletons":3,"top_values":[["\u041a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0437\u0430\u0445\u0430\u0440, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (<span class=\"allergen\">\u0441\u043e\u0435\u0432\u0438</span>), \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f, \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e,",1],["",1],["\u0417\u0430\u0445\u0430\u0440, \u043f\u0430\u043b\u043c\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, <span class=\"allergen\">\u041b\u0415\u0428\u041d\u0418\u0426\u0418</span> (13%), \u043e\u0431\u0435\u0437\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u041c\u041b\u042f\u041a\u041e \u043d\u0430 \u043f\u0440\u0430\u0445 (8,7%), \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445 (7,4%), \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d\u0438 (<span class=\"allergen\">\u0421\u041e\u042f</span>), 
\u0432\u0430\u043d\u0438\u043b\u0438\u043d.",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"\u041a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0437\u0430\u0445\u0430\u0440, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (<span class=\"allergen\">\u0441\u043e\u0435\u0432\u0438</span>), \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f, \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e,"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"ingredients_text_with_allergens_et","extras":{"singletons":3,"top_values":[["kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (<span class=\"allergen\">sojin</span> lecitin); ekstrakt vanilije.",1],["Kakaomasse*, Zucker, Kakaobutter, Kakaopulver stark ent\u00f6it, Emulgator: Sonnenblumenlecithine (E-322), nat\u00fcrliches Vanille-Aroma, \r\n* Rainforest Alliance Certified,\r\nKakao: 74% mindestens,",1],["Kakaomass, suhkur, kakaovoi, vanill.",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (<span class=\"allergen\">sojin</span> lecitin); ekstrakt 
vanilije."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_sk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_bg","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_sl","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_sk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"ingredients_text_with_allergens_sl","extras":{"singletons":1,"top_values":[["Kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (sojin lecitin); ekstrakt vanilije. Lahko vsebuje sledi ore\u0161kov (<span class=\"allergen\">le\u0161niki</span>, <span class=\"allergen\">mandlji</span>, <span class=\"allergen\">pistacija</span>) in mleka. Uporabno najmanj do: glej odtis na zadnji strani embala\u017ee.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Kakavova masa, manjmasten kakavov prah, kakavovo maslo, sladkor, emulgator: lecitini (sojin lecitin); ekstrakt vanilije. Lahko vsebuje sledi ore\u0161kov (<span class=\"allergen\">le\u0161niki</span>, <span class=\"allergen\">mandlji</span>, <span class=\"allergen\">pistacija</span>) in mleka. Uporabno najmanj do: glej odtis na zadnji strani embala\u017ee."}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_ca","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_sl","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% 
null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_dz","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_et","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_sk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_sk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"84.0% null"}],"column":"ingredients_text_with_allergens_pt","extras":{"singletons":3,"top_values":[["",5],["Creme para barrar de <span class=\"allergen\">AVELAS</span> </span>e cacau 40% (a\u00e7\u00facar, gordura de palma, <span 
class=\"allergen\">AVELAS</span> (13%), <span class=\"allergen\">LEITE</span> </span>desnatado em p\u00f3 (8,7%), cacau magro (7,4%), emulsionantes: lecitinas (<span class=\"allergen\">SOJA</span>), vanilina), farinha de <span class=\"allergen\">TRIGO</span> (32,5%), gorduras vegetais (palma, palmiste), a\u00e7\u00facar de cana (cont\u00e9m <span class=\"allergen\">TRIGO</span>) (8,5%), <span class=\"allergen\">LACTOSE</span>, farelo de <span class=\"allergen\">TRIGO</span>, <span class=\"allergen\">LEITE</span> </span>inteiro em p\u00f3, mel, levedantes qu\u00edmicos (difosfato diss\u00f3dico, hidrogenocarbonato de s\u00f3dio, hidrogenocarbonato de am\u00f3nio), farinha de <span class=\"allergen\">CEVADA</span> </span>maltada, cacau magro, sal, extrato em p\u00f3 de malte de <span class=\"allergen\">CEVADA</span> </span>e milho, amido de <span class=\"allergen\">TRIGO</span>, emulsionantes: lecitinas (<span class=\"allergen\">SOJA</span>), vanilina.",1],["Farinha de <span class=\"allergen\">TRIGO</span>, gordura de palma, xarope de glucose, extrato de <span class=\"allergen\">CEVADA</span> malteada, levedantes (carbonatos de am\u00f3nio, carbonatos de s\u00f3dio), sal, <span class=\"allergen\">OVOS</span>, aroma, agente de tratamento da farinha (<span class=\"allergen\">METABISSULFITO</span> de s\u00f3dio).",1],["Pasta de cacau, a\u00e7\u00facar, manteiga de cacau, baunilha.",1]]},"kind":"categorical","n":50,"n_null":42,"n_unique":4,"null_rate":0.84,"stats":{"cardinality":4,"entropy":1.5487949406953985,"entropy_ratio":0.7743974703476992,"top_rate":0.625,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"ingredients_text_with_allergens_ca","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"80.0% null"}],"column":"generic_name_pt","extras":{"singletons":2,"top_values":[["",8],["Bolachas recheadas de creme para barrar de avel\u00e3s e cacau NUTELLA\u00ae",1],["Chocolate extrafino com 70% de cacau",1]]},"kind":"categorical","n":50,"n_null":40,"n_unique":3,"null_rate":0.8,"stats":{"cardinality":3,"entropy":0.9219280948873623,"entropy_ratio":0.5816718657178868,"top_rate":0.8,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"80.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_pt","extras":{"singletons":0,"top_values":[["",10]]},"kind":"categorical","n":50,"n_null":40,"n_unique":1,"null_rate":0.8,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"80.0% null"}],"column":"ingredients_text_pt","extras":{"singletons":3,"top_values":[["",7],["Creme para barrar de AVELAS e cacau 40% (a\u00e7\u00facar, gordura de palma, AVELAS (13%), LEITE desnatado em p\u00f3 (8,7%), cacau magro (7,4%), emulsionantes: lecitinas (SOJA), vanilina), farinha de TRIGO (32,5%), gorduras vegetais (palma, palmiste), a\u00e7\u00facar de cana (cont\u00e9m TRIGO) (8,5%), LACTOSE, farelo de TRIGO, LEITE inteiro em p\u00f3, mel, levedantes qu\u00edmicos (difosfato diss\u00f3dico, hidrogenocarbonato de s\u00f3dio, hidrogenocarbonato de am\u00f3nio), farinha de CEVADA maltada, cacau magro, sal, extrato em p\u00f3 de malte de CEVADA e milho, amido de TRIGO, 
emulsionantes: lecitinas (SOJA), vanilina.",1],["Farinha de _TRIGO_, gordura de palma, xarope de glucose, extrato de _CEVADA_ malteada, levedantes (carbonatos de am\u00f3nio, carbonatos de s\u00f3dio), sal, _OVOS_, aroma, agente de tratamento da farinha (_METABISSULFITO_ de s\u00f3dio).",1],["Pasta de cacau, a\u00e7\u00facar, manteiga de cacau, baunilha.",1]]},"kind":"categorical","n":50,"n_null":40,"n_unique":4,"null_rate":0.8,"stats":{"cardinality":4,"entropy":1.3567796494470397,"entropy_ratio":0.6783898247235198,"top_rate":0.7,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"80.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_pt","extras":{"singletons":0,"top_values":[["",10]]},"kind":"categorical","n":50,"n_null":40,"n_unique":1,"null_rate":0.8,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"constant","level":"info","message":"only one distinct value"}],"column":"nutrition_score_warning_nutriments_estimated","extras":{"histogram":{"counts":[0,0,2,0,0],"edges":[0.5,0.7,0.9,1.1,1.3,1.5]},"sample":[1.0,1.0]},"kind":"numeric","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"iqr":0.0,"kurtosis":0.0,"max":1.0,"mean":1.0,"median":1.0,"min":1.0,"n_outliers":0,"outlier_rate":0.0,"q1":1.0,"q3":1.0,"skew":0.0,"std":0.0,"zero_rate":0.0}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_bg","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"generic_name_et","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_ca","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_sl","extras":{"singletons":1,"top_values":[["ARRIBA 85% cacao",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"ARRIBA 85% cacao"}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_bg","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"ingredients_text_sk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"ingredients_text_bg","extras":{"singletons":3,"top_values":[["\u041a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0437\u0430\u0445\u0430\u0440, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (\u0441\u043e\u0435\u0432\u0438), \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f, \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e,",1],["",1],["\u0417\u0430\u0445\u0430\u0440, \u043f\u0430\u043b\u043c\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u041b\u0415\u0428\u041d\u0418\u0426\u0418 (13%), \u043e\u0431\u0435\u0437\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u041c\u041b\u042f\u041a\u041e \u043d\u0430 \u043f\u0440\u0430\u0445 (8,7%), \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445 (7,4%), \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d\u0438 (\u0421\u041e\u042f), 
\u0432\u0430\u043d\u0438\u043b\u0438\u043d.",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"\u041a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u043d\u0438\u0441\u043a\u043e\u043c\u0430\u0441\u043b\u0435\u043d\u043e \u043a\u0430\u043a\u0430\u043e \u043d\u0430 \u043f\u0440\u0430\u0445, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0437\u0430\u0445\u0430\u0440, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (\u0441\u043e\u0435\u0432\u0438), \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f, \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e,"}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_et","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_sk","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"6 singleton categories"},{"code":"null_rate","level":"warn","message":"80.0% 
null"}],"column":"product_name_pt","extras":{"singletons":6,"top_values":[["",4],["Cioccolato Fondente 85% Cacao",1],["Crocantes bolachas com um cora\u00e7\u00e3o cremoso de Nutella\u00ae",1],["70% Cacao noir intense",1],["Excellence 70% Cocoa Intense Dark",1],["Original",1],["Mix com sultanas e arandos",1]]},"kind":"categorical","n":50,"n_null":40,"n_unique":7,"null_rate":0.8,"stats":{"cardinality":7,"entropy":2.5219280948873624,"entropy_ratio":0.8983289127685206,"top_rate":0.4,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"abbreviated_product_name_fr","extras":{"singletons":7,"top_values":[["CRISTALINE Eau De Source 0.5L",1],["Nutella biscuits t22",1],["Authentique 275g, fr",1],["Fibres 230g, fr",1],["ORG Original 175g",1],["NESTLE DESSERT Noir 205g",1],["BRIOCHE TRANCHEE BIO 400g",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"CRISTALINE Eau De Source 0.5L"}},{"alerts":[{"code":"null_rate","level":"warn","message":"86.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"obsolete_imported","extras":{"singletons":0,"top_values":[["0",7]]},"kind":"categorical","n":50,"n_null":43,"n_unique":1,"null_rate":0.86,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"0"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"sources_fields","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"emb_code","extras":{"singletons":1,"top_values":[["EMB 44068 A",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"EMB 44068 A"}},{"alerts":[{"code":"null_rate","level":"warn","message":"86.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"lang_imported","extras":{"singletons":0,"top_values":[["fr",7]]},"kind":"categorical","n":50,"n_null":43,"n_unique":1,"null_rate":0.86,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"fr"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_zh","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"conservation_conditions_fr_imported","extras":{"singletons":7,"top_values":[["A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil, dans un endroit propre, frais et sans odeur.",1],["A conserver au sec et \u00e0 l'abri de la chaleur. 
Ne pas mettre au r\u00e9frig\u00e9rateur.",1],["A conserver dans un endroit sec \u00e0 l'abri de la lumi\u00e8re.",1],["Conserver dans un endroit frais et sec.",1],["\u00c0 conserver dans un endroit sec",1],["A conserver au frais et au sec.",1],["\u00c0 conserver dans son emballage ferm\u00e9, dans un endroit sec, \u00e0 temp\u00e9rature ambiante.",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil, dans un endroit propre, frais et sans odeur."}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"origin_fr_imported","extras":{"singletons":2,"top_values":[["France",1],["P\u00e2te de cacao (Afrique de l'Ouest, Am\u00e9rique du Sud)\nAfrique, Europe, Madagascar, Am\u00e9rique du Sud, Afrique de l'Ouest",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"France"}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"owner","extras":{"singletons":5,"top_values":[["org-barilla-france-sa",2],["org-gie-sources-alma",1],["org-ferrero-france-commerciale",1],["org-kellogg-s",1],["org-nestle-france",1],["org-la-boulangere-co",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":6,"null_rate":0.86,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"org-barilla-france-sa"}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% 
null"}],"column":"ingredients_text_fr_imported","extras":{"singletons":7,"top_values":[["Eau de Source",1],["P\u00e2te \u00e0 tartiner aux NOISETTES et au cacao 40% (sucre, huile de palme, NOISETTES 13%, LAIT \u00e9cr\u00e9m\u00e9 en poudre 8,7%, cacao maigre 7,4%, \u00e9mulsifiants : l\u00e9cithines [SOJA] ; vanilline), farine de FROMENT 32%, graisses v\u00e9g\u00e9tales (palme, palmiste), sucre de canne 8,5%, LACTOSE, son de BLE, LAIT en poudre, extrait en poudre de malt d'ORGE et de ma\u00efs, miel, poudres \u00e0 lever (disphosphate disodique, carbonate acide d'ammonium, carbonate acide de sodium), cacao maigre, sel, amidon de FROMENT, farine d'ORGE malt\u00e9, \u00e9mulsifiants : l\u00e9cithines [SOJA] ; vanilline.",1],["Farine compl\u00e8te de SEIGLE (77 g*), farine de SEIGLE (28 g*), levure, sel. Peut contenir des traces de LUPIN, LAIT, MOUTARDE, GRAINES DE S\u00c9SAME et SOJA. *en g pour 100 g de produit.",1],["Farine compl\u00e8te de SEIGLE 59 g*, son de BL\u00c9 27 g*, flocons d'AVOINE 12 g*, GRAINES DE S\u00c9SAME 7,0 g*, germe de BL\u00c9, sel. *en g pour 100 g de produit fini. Peut contenir des traces de LUPIN, LAIT, MOUTARDE et SOJA.",1],["Pommes de terre d\u00e9shydrat\u00e9es, huiles v\u00e9g\u00e9tales (tournesol, ma\u00efs), farine de riz, amidon de BL\u00c9, farine de ma\u00efs, \u00e9mulsifiant (E471), maltodextrine, sel, extrait de levure, levure en poudre, colorant (rocou).",1],["Sucre, p\u00e2te de cacao (Afrique de l'Ouest, Am\u00e9rique du Sud), beurre de cacao, \u00e9mulsifiant (l\u00e9cithine), ar\u00f4me naturel de vanille de Madagascar. Cacao : 53% minimum. Peut contenir : LAIT, FRUITS A COQUE.",1],["Farine de BL\u00c9*/** 54%, \u0152UFS entiers*/** 14%, sucre de canne roux*, huile de tournesol*/** 8%, levain* (eau, farines de BL\u00c9*/** 2% et de SEIGLE*, levures), GLUTEN DE BL\u00c9*, sel, levure, ar\u00f4me naturel de vanille* (contient alcool*), extrait de vanille*, levure d\u00e9sactiv\u00e9e. 
Traces \u00e9ventuelles de lait, moutarde et soja. *Ingr\u00e9dients issus de l'Agriculture Biologique. **Ingr\u00e9dients issus du commerce \u00e9quitable fran\u00e7ais.",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"Eau de Source"}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"owners_tags","extras":{"singletons":5,"top_values":[["org-barilla-france-sa",2],["org-gie-sources-alma",1],["org-ferrero-france-commerciale",1],["org-kellogg-s",1],["org-nestle-france",1],["org-la-boulangere-co",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":6,"null_rate":0.86,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"org-barilla-france-sa"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_zh","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"86.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"nutrition_data_prepared_per_imported","extras":{"singletons":0,"top_values":[["100g",7]]},"kind":"categorical","n":50,"n_null":43,"n_unique":1,"null_rate":0.86,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"100g"}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% 
null"}],"column":"abbreviated_product_name_fr_imported","extras":{"singletons":7,"top_values":[["CRISTALINE Eau De Source 0.5L",1],["Nutella biscuits t22",1],["Authentique 275g, fr",1],["Fibres 230g, fr",1],["ORG Original 175g",1],["NESTLE DESSERT Noir 205g",1],["BRIOCHE TRANCHEE BIO 400g",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"CRISTALINE Eau De Source 0.5L"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"generic_name_zh_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"customer_service_fr","extras":{"singletons":5,"top_values":[["Service Consommateurs, : www.wasa.com/fr-fr/contact (depuis la France), www.wasa.com/fr-be/contact (depuis la Belgique)",2],["Service Consommateurs Cristaline, 70 avenue des Sources 03270 SAINT YORRE",1],["FERRERO FRANCE COMMERCIALE - Service Consommateurs, CS 90058 - 76136 MONT SAINT AIGNAN Cedex",1],["Service Conseil Consommateurs, Kellogg's Produits Alimentaires S.A.S. 
- Immeuble Neptune - 1 rue Galil\u00e9e 93160 Noisy-le-Grand (France)",1],["Nestl\u00e9 France, 34-40 rue Guynemer 92130 Issy-les-Moulineaux",1],["Service consommateurs La Boulang\u00e8re & Co, La Boulang\u00e8re & Co 1 rue du petit bocage CS 40 201 85140 ESSARTS",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":6,"null_rate":0.86,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"Service Consommateurs, : www.wasa.com/fr-fr/contact (depuis la France), www.wasa.com/fr-be/contact (depuis la Belgique)"}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"customer_service_fr_imported","extras":{"singletons":5,"top_values":[["Service Consommateurs, : www.wasa.com/fr-fr/contact (depuis la France), www.wasa.com/fr-be/contact (depuis la Belgique)",2],["Service Consommateurs Cristaline, 70 avenue des Sources 03270 SAINT YORRE",1],["FERRERO FRANCE COMMERCIALE - Service Consommateurs, CS 90058 - 76136 MONT SAINT AIGNAN Cedex",1],["Service Conseil Consommateurs, Kellogg's Produits Alimentaires S.A.S. 
- Immeuble Neptune - 1 rue Galil\u00e9e 93160 Noisy-le-Grand (France)",1],["Nestl\u00e9 France, 34-40 rue Guynemer 92130 Issy-les-Moulineaux",1],["Service consommateurs La Boulang\u00e8re & Co, La Boulang\u00e8re & Co 1 rue du petit bocage CS 40 201 85140 ESSARTS",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":6,"null_rate":0.86,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"Service Consommateurs, : www.wasa.com/fr-fr/contact (depuis la France), www.wasa.com/fr-be/contact (depuis la Belgique)"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_text_zh_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"product_name_fr_imported","extras":{"singletons":7,"top_values":[["CRISTALINE Eau De Source 0.5L",1],["Biscuits Nutella x22 biscuits fourr\u00e9s - 304g",1],["Wasa tartine croustillante authentique au seigle 275g",1],["Wasa tartine croustillante fibres 230g",1],["Chips Pringles Original",1],["NESTLE DESSERT Noir 205g",1],["Brioche Tranch\u00e9e Bio 400g",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"CRISTALINE Eau De Source 0.5L"}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"brands_imported","extras":{"singletons":5,"top_values":[["Wasa",2],["Cristaline",1],["Nutella biscuits",1],["Pringles",1],["NESTLE DESSERT,Tablettes",1],["La 
boulangere",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":6,"null_rate":0.86,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"Wasa"}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"88.0% null"}],"column":"owner_imported","extras":{"singletons":4,"top_values":[["org-barilla-france-sa",2],["org-gie-sources-alma",1],["org-ferrero-france-commerciale",1],["org-nestle-france",1],["org-la-boulangere-co",1]]},"kind":"categorical","n":50,"n_null":44,"n_unique":5,"null_rate":0.88,"stats":{"cardinality":5,"entropy":2.2516291673878226,"entropy_ratio":0.9697238998682473,"top_rate":0.3333333333333333,"top_value":"org-barilla-france-sa"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"product_name_zh_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"84.0% null"}],"column":"lc_imported","extras":{"singletons":1,"top_values":[["fr",7],["es",1]]},"kind":"categorical","n":50,"n_null":42,"n_unique":2,"null_rate":0.84,"stats":{"cardinality":2,"entropy":0.5435644431995964,"entropy_ratio":0.5435644431995964,"top_rate":0.875,"top_value":"fr"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_zh","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% 
null"}],"column":"quantity_imported","extras":{"singletons":7,"top_values":[["500 ml",1],["304 g",1],["275 g",1],["230 g",1],["175 g",1],["205 g",1],["400 g",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"500 ml"}},{"alerts":[{"code":"null_rate","level":"warn","message":"84.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"nutrition_data_per_imported","extras":{"singletons":0,"top_values":[["100g",8]]},"kind":"categorical","n":50,"n_null":42,"n_unique":1,"null_rate":0.84,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"100g"}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"generic_name_fr_imported","extras":{"singletons":7,"top_values":[["Eau De Source",1],["Biscuit fourr\u00e9 \u00e0 la p\u00e2te \u00e0 tartiner aux noisettes et au cacao Nutella\u00ae",1],["Pain croustillant a la farine de seigle",1],["Pain croustillant \u00e0 la farine compl\u00e8te de seigle, avoine et s\u00e9same.",1],["Snack sal\u00e9",1],["Chocolat noir sup\u00e9rieur",1],["Brioche tranch\u00e9e issue de l'agriculture biologique",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"Eau De Source"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"owner_fields","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"88.0% null"}],"column":"categories_imported","extras":{"singletons":4,"top_values":[["Snacks, Snacks 
sal\u00e9s, Amuse-gueules, Chips et frites, Chips",2],["Boissons et pr\u00e9parations de boissons, Boissons, Eaux, Eaux de sources",1],["Snacks, Snacks sucr\u00e9s, Biscuits et g\u00e2teaux, Biscuits sucr\u00e9s & biscuits ap\u00e9ritifs, Biscuits, en:Biscuits/Cookies (Shelf Stable)",1],["Snacks, Snacks sucr\u00e9s, Cacao et d\u00e9riv\u00e9s, Chocolats, Chocolats noirs, Chocolat noir p\u00e2tissier en tablette \u00e0 40% de cacao minimum",1],["Snacks, Snacks sucr\u00e9s, en:Sweet pastries and pies, Viennoiseries",1]]},"kind":"categorical","n":50,"n_null":44,"n_unique":5,"null_rate":0.88,"stats":{"cardinality":5,"entropy":2.2516291673878226,"entropy_ratio":0.9697238998682473,"top_rate":0.3333333333333333,"top_value":"Snacks, Snacks sal\u00e9s, Amuse-gueules, Chips et frites, Chips"}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"conservation_conditions_fr","extras":{"singletons":7,"top_values":[["A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil, dans un endroit propre, frais et sans odeur.",1],["A conserver au sec et \u00e0 l'abri de la chaleur. 
Ne pas mettre au r\u00e9frig\u00e9rateur.",1],["A conserver dans un endroit sec \u00e0 l'abri de la lumi\u00e8re.",1],["Conserver dans un endroit frais et sec.",1],["\u00c0 conserver dans un endroit sec",1],["A conserver au frais et au sec.",1],["\u00c0 conserver dans son emballage ferm\u00e9, dans un endroit sec, \u00e0 temp\u00e9rature ambiante.",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil, dans un endroit propre, frais et sans odeur."}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"conservation_conditions","extras":{"singletons":7,"top_values":[["A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil, dans un endroit propre, frais et sans odeur.",1],["A conserver au sec et \u00e0 l'abri de la chaleur. 
Ne pas mettre au r\u00e9frig\u00e9rateur.",1],["A conserver dans un endroit sec \u00e0 l'abri de la lumi\u00e8re.",1],["Conserver dans un endroit frais et sec.",1],["\u00c0 conserver dans un endroit sec",1],["A conserver au frais et au sec.",1],["\u00c0 conserver dans son emballage ferm\u00e9, dans un endroit sec, \u00e0 temp\u00e9rature ambiante.",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil, dans un endroit propre, frais et sans odeur."}},{"alerts":[{"code":"null_rate","level":"warn","message":"84.0% null"}],"column":"countries_imported","extras":{"singletons":1,"top_values":[["France",7],["Espa\u00f1a",1]]},"kind":"categorical","n":50,"n_null":42,"n_unique":2,"null_rate":0.84,"stats":{"cardinality":2,"entropy":0.5435644431995964,"entropy_ratio":0.5435644431995964,"top_rate":0.875,"top_value":"France"}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"origins_fr","extras":{"singletons":2,"top_values":[["Chambon-la-For\u00eat,France,Cairanne,Provence-Alpes-C\u00f4te d'Azur,Vaucluse,Italie,Source Sainte C\u00e9cile,Source Of\u00e9lia,Source \u00c9l\u00e9onore,Source Emma,Source \u00c9l\u00e9na",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"Chambon-la-For\u00eat,France,Cairanne,Provence-Alpes-C\u00f4te d'Azur,Vaucluse,Italie,Source Sainte C\u00e9cile,Source Of\u00e9lia,Source \u00c9l\u00e9onore,Source Emma,Source \u00c9l\u00e9na"}},{"alerts":[{"code":"long_tail","level":"info","message":"7 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% 
null"}],"column":"abbreviated_product_name","extras":{"singletons":7,"top_values":[["CRISTALINE Eau De Source 0.5L",1],["Nutella biscuits t22",1],["Authentique 275g, fr",1],["Fibres 230g, fr",1],["ORG Original 175g",1],["NESTLE DESSERT Noir 205g",1],["BRIOCHE TRANCHEE BIO 400g",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":7,"null_rate":0.86,"stats":{"cardinality":7,"entropy":2.807354922057604,"entropy_ratio":1.0,"top_rate":0.14285714285714285,"top_value":"CRISTALINE Eau De Source 0.5L"}},{"alerts":[{"code":"long_tail","level":"info","message":"5 singleton categories"},{"code":"null_rate","level":"warn","message":"86.0% null"}],"column":"customer_service","extras":{"singletons":5,"top_values":[["Service Consommateurs, : www.wasa.com/fr-fr/contact (depuis la France), www.wasa.com/fr-be/contact (depuis la Belgique)",2],["Service Consommateurs Cristaline, 70 avenue des Sources 03270 SAINT YORRE",1],["FERRERO FRANCE COMMERCIALE - Service Consommateurs, CS 90058 - 76136 MONT SAINT AIGNAN Cedex",1],["Service Conseil Consommateurs, Kellogg's Produits Alimentaires S.A.S. 
- Immeuble Neptune - 1 rue Galil\u00e9e 93160 Noisy-le-Grand (France)",1],["Nestl\u00e9 France, BP 900 Noisiel 77446 Marne la Vall\u00e9e Cedex 2",1],["Service consommateurs La Boulang\u00e8re & Co, La Boulang\u00e8re & Co 1 rue du petit bocage CS 40 201 85140 ESSARTS",1]]},"kind":"categorical","n":50,"n_null":43,"n_unique":6,"null_rate":0.86,"stats":{"cardinality":6,"entropy":2.5216406363433186,"entropy_ratio":0.9755037590061086,"top_rate":0.2857142857142857,"top_value":"Service Consommateurs, : www.wasa.com/fr-fr/contact (depuis la France), www.wasa.com/fr-be/contact (depuis la Belgique)"}},{"alerts":[{"code":"long_tail","level":"info","message":"8 singleton categories"},{"code":"null_rate","level":"warn","message":"84.0% null"}],"column":"data_sources_imported","extras":{"singletons":8,"top_values":[["Producers, Producer - gie-sources-alma, Database - Equadis, Database - GDSN, Databases, Producers, Producer - gie-sources-alma",1],["Producers, Producer - ferrero-france-commerciale, Database - Equadis, Database - GDSN, Databases, Producers, Producer - ferrero-france-commerciale",1],["Database - Equadis, Database - GDSN, Databases, Producers, Producer - barilla-france-sa, Producers, Producer - barilla-france-sa",1],["Apps, app-elcoco",1],["Producers, Producer - barilla-france-sa, Database - Equadis, Database - GDSN, Databases, Producers, Producer - barilla-france-sa",1],["Database - CodeOnline, Database - GDSN, Databases",1],["Database - Equadis, Database - GDSN, Databases, Producers, Producer - nestle-france, Producers, Producer - nestle-france",1],["Producers, Producer - la-boulangere-co, Database - Equadis, Database - GDSN, Databases, Producers, Producer - la-boulangere-co",1]]},"kind":"categorical","n":50,"n_null":42,"n_unique":8,"null_rate":0.84,"stats":{"cardinality":8,"entropy":3.0,"entropy_ratio":1.0,"top_rate":0.125,"top_value":"Producers, Producer - gie-sources-alma, Database - Equadis, Database - GDSN, Databases, Producers, Producer - 
gie-sources-alma"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"nova_group_error","extras":{"singletons":0,"top_values":[["too_many_unknown_ingredients",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"too_many_unknown_ingredients"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1648897071_result","extras":{"singletons":1,"top_values":[["Nuss-Nougat-Creme 40% (Zucker, Palm\u00f6l, _Haseln\u00fcsse_ 13%, _Magermilchpulver_ 8,7%, fettarmer Kakao 7,4%, Emulgator Lecithine (_Soja_), Vanillin), _Weizenmehl_ 32,5%, pflanzliche Fette (Palm, Palmkern), Rohrzucker 8,5% (enth\u00e4lt _Weizen_), _Milchzucker_, _Weizenkleie_, _Vollmilchpulver_, _Gerstenmalz_ - und Maisextraktpulver, Honig, Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, _Weizenst\u00e4rke_, _Gerstenmalzmehl_, Emulgator Lecithine (_Soja_), Vanillin",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Nuss-Nougat-Creme 40% (Zucker, Palm\u00f6l, _Haseln\u00fcsse_ 13%, _Magermilchpulver_ 8,7%, fettarmer Kakao 7,4%, Emulgator Lecithine (_Soja_), Vanillin), _Weizenmehl_ 32,5%, pflanzliche Fette (Palm, Palmkern), Rohrzucker 8,5% (enth\u00e4lt _Weizen_), _Milchzucker_, _Weizenkleie_, _Vollmilchpulver_, _Gerstenmalz_ - und Maisextraktpulver, Honig, Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, _Weizenst\u00e4rke_, _Gerstenmalzmehl_, Emulgator Lecithine 
(_Soja_), Vanillin"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_ro","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"product_name_ro","extras":{"singletons":2,"top_values":[["",1],["Sour Cream & Onion",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"producer_version_id","extras":{"singletons":2,"top_values":[["1",2],["2021-01-25T13:53:49+01:00",1],["44217063",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":3,"null_rate":0.92,"stats":{"cardinality":3,"entropy":1.5,"entropy_ratio":0.9463946303571862,"top_rate":0.5,"top_value":"1"}},{"alerts":[{"code":"long_tail","level":"info","message":"6 singleton categories"},{"code":"null_rate","level":"warn","message":"88.0% null"}],"column":"serving_size_imported","extras":{"singletons":6,"top_values":[["13.8 g (1)",1],["11.4 g (1 tranche)",1],["10 g (1 tranche)",1],["30 g",1],["25.6 g (5 carr\u00e9s (25,6 g))",1],["26.7 g (1 tranche de 26.7 g environ)",1]]},"kind":"categorical","n":50,"n_null":44,"n_unique":6,"null_rate":0.88,"stats":{"cardinality":6,"entropy":2.584962500721156,"entropy_ratio":1.0,"top_rate":0.16666666666666666,"top_value":"13.8 g (1)"}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"no_nutrition_data_imported","extras":{"singletons":0,"top_values":[["false",4]]},"kind":"categorical","n":50,"n_null":46,"n_unique":1,"null_rate":0.92,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"false"}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"packaging_imported","extras":{"singletons":1,"top_values":[["Enveloppe",3],["Bo\u00eete, Barquette",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":2,"null_rate":0.92,"stats":{"cardinality":2,"entropy":0.8112781244591328,"entropy_ratio":0.8112781244591328,"top_rate":0.75,"top_value":"Enveloppe"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_ro","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"producer_version_id_imported","extras":{"singletons":2,"top_values":[["1",2],["2021-01-25T13:53:49+01:00",1],["44217063",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":3,"null_rate":0.92,"stats":{"cardinality":3,"entropy":1.5,"entropy_ratio":0.9463946303571862,"top_rate":0.5,"top_value":"1"}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"labels_imported","extras":{"singletons":2,"top_values":[["V\u00e9g\u00e9tarien",3],["Point Vert, Rainforest Alliance, Triman",1],["Commerce \u00e9quitable, Bio, Bio europ\u00e9en, 
en:organic",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":3,"null_rate":0.9,"stats":{"cardinality":3,"entropy":1.3709505944546687,"entropy_ratio":0.8649735207179273,"top_rate":0.6,"top_value":"V\u00e9g\u00e9tarien"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1648990410_result","extras":{"singletons":1,"top_values":[["Kekse mit Nuss - Nugat - Creme - F\u00fcllung: Nuss-Nugat-Creme 40% (Zucker, Palm\u00f6l, HASELN\u00dcSSE  Magermilchpulver, fettarmer Kakao, Emulgator Lecithine (S0JA), Vanillin, Weizenmehl, pflanzliche Fette ( Palm, Palmkern), Rohrzucker, Milchzucker, Weizenkleie, VOLLMILCHPULVER, GERSTENMALZ-und Maisextraktpulver, Honig. Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, Weizenst\u00e4rke, Gerstenmalzmehl, Emulgator Lecithine (Soja), Vanillin",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Kekse mit Nuss - Nugat - Creme - F\u00fcllung: Nuss-Nugat-Creme 40% (Zucker, Palm\u00f6l, HASELN\u00dcSSE  Magermilchpulver, fettarmer Kakao, Emulgator Lecithine (S0JA), Vanillin, Weizenmehl, pflanzliche Fette ( Palm, Palmkern), Rohrzucker, Milchzucker, Weizenkleie, VOLLMILCHPULVER, GERSTENMALZ-und Maisextraktpulver, Honig. 
Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, Weizenst\u00e4rke, Gerstenmalzmehl, Emulgator Lecithine (Soja), Vanillin"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"90.0% null"}],"column":"allergens_imported","extras":{"singletons":3,"top_values":[["Gluten",2],["Gluten, Lait, Fruits \u00e0 coque, Soja, Gs1:T4078:ML",1],["Gluten, Graines de s\u00e9same",1],["\u0152ufs, Gluten",1]]},"kind":"categorical","n":50,"n_null":45,"n_unique":4,"null_rate":0.9,"stats":{"cardinality":4,"entropy":1.9219280948873623,"entropy_ratio":0.9609640474436811,"top_rate":0.4,"top_value":"Gluten"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1648990410","extras":{"singletons":1,"top_values":[["Kekse mit Nuss - Nugat- Creme - F\u00fcllung: Nuss-Nugat-Creme 40% (Zucker, Palm\u00f6l, HASELN\u00dcSSE  Magermilchpulver, fettarmer Kakao, Emulgator Lecithine (S0JA), Vanillin, Weizenmehl, pflanzliche Fette ( Palm, Palmkern), Rohrzucker, Milchzucker, Weizenkleie, VOLLMILCHPULVER, GERSTENMALZ-und Maisextraktpulver, Honig. 
Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, Weizenst\u00e4rke, Gerstenmalzmehl, Emulgator Lecithine (Soja), Vanillin",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Kekse mit Nuss - Nugat- Creme - F\u00fcllung: Nuss-Nugat-Creme 40% (Zucker, Palm\u00f6l, HASELN\u00dcSSE  Magermilchpulver, fettarmer Kakao, Emulgator Lecithine (S0JA), Vanillin, Weizenmehl, pflanzliche Fette ( Palm, Palmkern), Rohrzucker, Milchzucker, Weizenkleie, VOLLMILCHPULVER, GERSTENMALZ-und Maisextraktpulver, Honig. Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, Weizenst\u00e4rke, Gerstenmalzmehl, Emulgator Lecithine (Soja), Vanillin"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1648897071","extras":{"singletons":1,"top_values":[["Nuss-Nougat-Creme 40% (Zucker, Palm\u00f6l, _Haseln\u00fcsse_ 13%, _Magermilchpulver_ 8,7%, fettarmer Kakao 7,4%, Emulgator Lecithine (_Soja_), Vanillin), _Weizenmehl_ 32,5%, pflanzliche Fette (Palm, Palmkern), Rohrzucker 8,5% (enth\u00e4lt _Weizen_), _Milchzucker_, _Weizenkleie_, _Vollmilchpulver_, _Gerstenmalz_- und Maisextraktpulver, Honig, Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, _Weizenst\u00e4rke_, _Gerstenmalzmehl_, Emulgator Lecithine (_Soja_), Vanillin",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Nuss-Nougat-Creme 40% (Zucker, Palm\u00f6l, _Haseln\u00fcsse_ 13%, _Magermilchpulver_ 8,7%, fettarmer Kakao 7,4%, Emulgator 
Lecithine (_Soja_), Vanillin), _Weizenmehl_ 32,5%, pflanzliche Fette (Palm, Palmkern), Rohrzucker 8,5% (enth\u00e4lt _Weizen_), _Milchzucker_, _Weizenkleie_, _Vollmilchpulver_, _Gerstenmalz_- und Maisextraktpulver, Honig, Backtriebmittel: Dinatriumdiphosphat, Natriumhydrogencarbonat, Ammoniumhydrogencarbonat; fettarmer Kakao, Salz, _Weizenst\u00e4rke_, _Gerstenmalzmehl_, Emulgator Lecithine (_Soja_), Vanillin"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_ro","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_ro","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"abbreviated_product_name_imported","extras":{"singletons":3,"top_values":[["Authentique 275g, fr",1],["Fibres 230g, fr",1],["DESSERT Noir 205g",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"Authentique 275g, fr"}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"traces_imported","extras":{"singletons":4,"top_values":[["Lupin, Lait, Moutarde, Graines de s\u00e9same, Soja",1],["Lupin, Lait, Moutarde, Soja",1],["Lait, 
Fruits \u00e0 coque",1],["Lait, Moutarde, Soja",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":4,"null_rate":0.92,"stats":{"cardinality":4,"entropy":2.0,"entropy_ratio":1.0,"top_rate":0.25,"top_value":"Lupin, Lait, Moutarde, Graines de s\u00e9same, Soja"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"specific_ingredients","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"product_name_ru","extras":{"singletons":1,"top_values":[["",2],["\u042d\u043a\u0441\u0435\u043b\u0435\u043d\u0441 99% \u043a\u0430\u043a\u0430\u043e",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":2,"null_rate":0.94,"stats":{"cardinality":2,"entropy":0.9182958340544896,"entropy_ratio":0.9182958340544896,"top_rate":0.6666666666666666,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_ru","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_ru","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"packaging_text_ru","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"generic_name_ru","extras":{"singletons":1,"top_values":[["",2],["\u041f\u043b\u0438\u0442\u043a\u0430 \u0433\u043e\u0440\u044c\u043a\u043e\u0433\u043e \u0448\u043e\u043a\u043e\u043b\u0430\u0434\u0430 (99% \u043a\u0430\u043a\u0430\u043e)",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":2,"null_rate":0.94,"stats":{"cardinality":2,"entropy":0.9182958340544896,"entropy_ratio":0.9182958340544896,"top_rate":0.6666666666666666,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_ru","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"ingredients_text_da","extras":{"singletons":2,"top_values":[["_VETEMJ\u00d6L_/_HVEDEMEL_, palmolja/-olie, glukossirap, maltextrakt fr\u00e5n _KORN_/_BYG_, bakpulver/h\u00e6vemidler (ammoniumkarbonater, natriumkarbonater), salt, _\u00c4GG_/_\u00c6G_/_EGG_, arom, mj\u00f6lbehandlingsmedel/melbehandlingsmiddel (_NATRIUMDISULFIT_).",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"_VETEMJ\u00d6L_/_HVEDEMEL_, palmolja/-olie, glukossirap, maltextrakt fr\u00e5n _KORN_/_BYG_, bakpulver/h\u00e6vemidler (ammoniumkarbonater, natriumkarbonater), salt, 
_\u00c4GG_/_\u00c6G_/_EGG_, arom, mj\u00f6lbehandlingsmedel/melbehandlingsmiddel (_NATRIUMDISULFIT_)."}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"ingredients_text_with_allergens_da","extras":{"singletons":2,"top_values":[["<span class=\"allergen\">VETEMJ\u00d6L</span>/<span class=\"allergen\">HVEDEMEL</span>, palmolja/-olie, glukossirap, maltextrakt fr\u00e5n <span class=\"allergen\">KORN</span>/<span class=\"allergen\">BYG</span>, bakpulver/h\u00e6vemidler (ammoniumkarbonater, natriumkarbonater), salt, <span class=\"allergen\">\u00c4GG</span>/<span class=\"allergen\">\u00c6G</span>/<span class=\"allergen\">EGG</span>, arom, mj\u00f6lbehandlingsmedel/melbehandlingsmiddel (<span class=\"allergen\">NATRIUMDISULFIT</span>).",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"<span class=\"allergen\">VETEMJ\u00d6L</span>/<span class=\"allergen\">HVEDEMEL</span>, palmolja/-olie, glukossirap, maltextrakt fr\u00e5n <span class=\"allergen\">KORN</span>/<span class=\"allergen\">BYG</span>, bakpulver/h\u00e6vemidler (ammoniumkarbonater, natriumkarbonater), salt, <span class=\"allergen\">\u00c4GG</span>/<span class=\"allergen\">\u00c6G</span>/<span class=\"allergen\">EGG</span>, arom, mj\u00f6lbehandlingsmedel/melbehandlingsmiddel (<span class=\"allergen\">NATRIUMDISULFIT</span>)."}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"product_name_da","extras":{"singletons":2,"top_values":[["Original",1],["Alpine Milk",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"Original"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% 
null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_da","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"generic_name_da","extras":{"singletons":2,"top_values":[["Kiks",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"Kiks"}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"forest_footprint_data","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_da","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_sr","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"ingredients_text_nl_ocr_1675675383_result","extras":{"singletons":1,"top_values":[["Cacaomassa, suiker, cacaoboter, natuurlijk Bourbon vanille - stokje.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Cacaomassa, suiker, cacaoboter, natuurlijk Bourbon vanille - stokje."}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"ingredients_text_cs","extras":{"singletons":1,"top_values":[["",2],["Kakaov\u00e1 hmota, cukr, kakaov\u00e9 m\u00e1slo, vanilka.",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":2,"null_rate":0.94,"stats":{"cardinality":2,"entropy":0.9182958340544896,"entropy_ratio":0.9182958340544896,"top_rate":0.6666666666666666,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"product_name_cs","extras":{"singletons":1,"top_values":[["",2],["Excellence 70% Cocoa Intense Dark",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":2,"null_rate":0.94,"stats":{"cardinality":2,"entropy":0.9182958340544896,"entropy_ratio":0.9182958340544896,"top_rate":0.6666666666666666,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_hu","extras":{"singletons":0,"top_values":[["",4]]},"kind":"categorical","n":50,"n_null":46,"n_unique":1,"null_rate":0.92,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"packaging_text_hu","extras":{"singletons":0,"top_values":[["",4]]},"kind":"categorical","n":50,"n_null":46,"n_unique":1,"null_rate":0.92,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_cs","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"ingredients_text_with_allergens_hu","extras":{"singletons":3,"top_values":[["Kaka\u00f3massza, cukor, kaka\u00f3 - <span class=\"allergen\">vaj</span>, van\u00edlia.",1],["HU \u00c9tcsokol\u00e1d\u00e9. Kaka\u00f3 sz\u00e1razanyag legal\u00e1bb 70% . \u00d6Sszetev\u0151k: kaka\u00f3massza, cukor, kaka\u00f3vaj, emulge\u00e1l\u00f3szerek: lecitinek (<span class=\"allergen\">sz\u00f3j\u00e1b\u00f3l</span>); van\u00edlia kivonat. Nyomokban di\u00f3f\u00e9l\u00e9ket \u00e9s <span class=\"allergen\">tejet</span> tartalmazhat. Bontatlan csomagol\u00e1sban t\u00e1rolva min\u0151s\u00e9g\u00e9t meg\u00f3rzi (nap/h\u00f3nap/\u00e9v): a csomagol\u00e1s h\u00e1toldal\u00e1n felt\u00fcntetett id\u0151pontig. Sz\u00e1raz, h\u0171v\u00f6s helyen t\u00e1roland\u00f3! K\u00e9sz\u00fclt: N\u00e9metorsz\u00e1gban. A kaka\u00f3bab sz\u00e1rmaz\u00e1si helye: Ecuador, Elef\u00e1ntcsontpart, Gh\u00e1na, Kamerun \u00e9s Nigeria. A Fairtrade Cocoa Program (Fairtrade Kaka\u00f3 Program) el\u0151ny\u00f6kh\u00f6z juttatja a kistermel\u0151ket az\u00e1ltal, hogy t\u00f6bb kaka\u00f3t \u00e9rt\u00e9kes\u00edtenek Fairtrade term\u00e9kk\u00e9nt. L\u00e1togasson el a www.info.fairtrade.net/program oldalra. 
\r\n\r\nRO Ciocolat\u0103 am\u0103ruie. Substant\u0103 uscat\u0103 de cacao minimum 70% Ingrediente: mas\u0103 de cacao, zah\u0103r, unt de cacao, emulsifiant: lecitine din soia; extract din vanilie. Cu ingrediente din t\u0103ri UE \u015fi non UE. Poate contine urme de fructe cu coaj\u0103 lemnoas\u0103 \u015fi lapte. A se consuma de preferint\u0103 \u00eenainte de/Nr. Lot: vezi spate ambalaj. A se p\u0103stra la loc uscat \u015fi r\u0103coros, ferit de razele soarelui \u0219i de \u00eenghet, at\u00e2t \u00eenainte, c\u00e2t \u015fi dup\u0103 deschidere. A se consuma \u00een cel mai scurt timp dup\u0103 deschidere. Fairtrade Cocoa Program (Programul Fairtrade de Cacao) permite micilor agricultori s\u0103 beneficieze de v\u00e2nzarea propriei cacao ca Fairtrade. Vizita\u021bi www.info.fairtrade.net/program. Produs in U.E. pentru S.C. Lidl Discount SRL, Sat Nedelea, Comuna Arice\u015ftii Rahtivani, DN 72, Cr\u00e2ngul lui Bot, KM 73+810, jude\u021bul Prahova, Rom\u00e2nia. \r\n\r\nBG \u041d\u0430\u0442\u0443\u0440\u0430\u043b\u0435\u043d \u0448\u043e\u043a\u043e\u043b\u0430\u0434. \u0421\u044a\u0434\u044a\u0440\u0436\u0430 \u043c\u0438\u043d. 70% \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430. \u0421\u044a\u0441\u0442\u0430\u0432\u043a\u0438: \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u0437\u0430\u0445\u0430\u0440, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (\u0441\u043e\u0435\u0432); \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f. \u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e. 
\u041d\u0435\u043e\u0442\u0432\u043e\u0440\u0435\u043d \u043d\u0430\u0439-\u0434\u043e\u0431\u044a\u0440 \u0434\u043e:/ \u041f\u0430\u0440\u0442\u0438\u0434\u0430: \u0432\u0438\u0436 \u0437\u0430\u0434\u043d\u0430\u0442\u0430 \u0441\u0442\u0440\u0430\u043d\u0430. \u0414\u0430 \u0441\u0435 \u0441\u044a\u0445\u0440\u0430\u043d\u044f\u0432\u0430 \u043d\u0430 \u0441\u0443\u0445\u043e \u0438 \u0445\u043b\u0430\u0434\u043d\u043e \u043c\u044f\u0441\u0442\u043e. \u041f\u0440\u043e\u0433\u0440\u0430\u043c\u0430\u0442\u0430 \u0437\u0430 \u0441\u0435\u0440\u0442\u0438\u0444\u0438\u0446\u0438\u0440\u0430\u043d\u0435 \u043d\u0430 \u043a\u0430\u043a\u0430\u043e Fairtrade \u0421\u043e\u0441\u043e\u0430 Program \u0434\u0430\u0432\u0430 \u0432\u044a\u0437\u043c\u043e\u0436\u043d\u043e\u0441\u0442 \u043d\u0430 \u043c\u0430\u043b\u043a\u0438\u0442\u0435 \u043f\u0440\u043e\u0438\u0437\u0432\u043e\u0434\u0438\u0442\u0435\u043b\u0438 \u0434\u0430 \u043f\u0440\u043e\u0434\u0430\u0432\u0430\u0442 \u043f\u043e\u0432\u0435\u0447\u0435 \u043a\u0430\u043a\u0430\u043e \u043f\u0440\u0438 \u0441\u043f\u0440\u0430\u0432\u0435\u0434\u043b\u0438\u0432\u0438 \u0443\u0441\u043b\u043e\u0432\u0438\u044f \u043d\u0430 \u0442\u044a\u0440\u0433\u043e\u0432\u0438\u044f. \u041f\u043e\u0432\u0435\u0447\u0435 \u0438\u043d\u0444\u043e\u0440\u043c\u0430\u0446\u0438\u044f \u043d\u0430 www.info.fairtrade.net/program \u041f\u0440\u043e\u0438\u0437\u0432\u0435\u0434\u0435\u043d\u043e \u0432 \u0413\u0435\u0440\u043c\u0430\u043d\u0438\u044f \u0437\u0430 \u041b\u0438\u0434\u043b \u0429\u0438\u0444\u0442\u0443\u043d\u0433 \u0435\u043d\u0434 \u041a\u043e. \u041a\u0413, \u0429\u0438\u0444\u0442\u0441\u0431\u0435\u0440\u0433\u0449\u0440\u0430\u0441\u0435 1, 74167 \u041d\u0435\u043a\u0430\u0440\u0437\u0443\u043b\u043c, \u0413\u0435\u0440\u043c\u0430\u043d\u0438\u044f. 
LIDL",1],["Cukor, p\u00e1lmaolaj, <span class=\"allergen\">MOGYOR\u00d3</span> (13%), zs\u00edrszeg\u00e9ny kaka\u00f3por (7,4%), sov\u00e1ny <span class=\"allergen\">TEJPOR</span> (6,6%), <span class=\"allergen\">TEJSAV\u00d3POR</span>, emulge\u00e1l\u00f3szer: lecitinek (<span class=\"allergen\">SZ\u00d3JA</span>); aroma (vanillin).",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"Kaka\u00f3massza, cukor, kaka\u00f3 - <span class=\"allergen\">vaj</span>, van\u00edlia."}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_cs","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"4 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"ingredients_text_hu","extras":{"singletons":4,"top_values":[["Kaka\u00f3massza, cukor, kaka\u00f3 - vaj, van\u00edlia.",1],["HU \u00c9tcsokol\u00e1d\u00e9. Kaka\u00f3 sz\u00e1razanyag legal\u00e1bb 70% . \u00d6Sszetev\u0151k: kaka\u00f3massza, cukor, kaka\u00f3vaj, emulge\u00e1l\u00f3szerek: lecitinek (sz\u00f3j\u00e1b\u00f3l); van\u00edlia kivonat. Nyomokban di\u00f3f\u00e9l\u00e9ket \u00e9s tejet tartalmazhat. Bontatlan csomagol\u00e1sban t\u00e1rolva min\u0151s\u00e9g\u00e9t meg\u00f3rzi (nap/h\u00f3nap/\u00e9v): a csomagol\u00e1s h\u00e1toldal\u00e1n felt\u00fcntetett id\u0151pontig. Sz\u00e1raz, h\u0171v\u00f6s helyen t\u00e1roland\u00f3! K\u00e9sz\u00fclt: N\u00e9metorsz\u00e1gban. A kaka\u00f3bab sz\u00e1rmaz\u00e1si helye: Ecuador, Elef\u00e1ntcsontpart, Gh\u00e1na, Kamerun \u00e9s Nigeria. 
A Fairtrade Cocoa Program (Fairtrade Kaka\u00f3 Program) el\u0151ny\u00f6kh\u00f6z juttatja a kistermel\u0151ket az\u00e1ltal, hogy t\u00f6bb kaka\u00f3t \u00e9rt\u00e9kes\u00edtenek Fairtrade term\u00e9kk\u00e9nt. L\u00e1togasson el a www.info.fairtrade.net/program oldalra. \r\n\r\nRO Ciocolat\u0103 am\u0103ruie. Substant\u0103 uscat\u0103 de cacao minimum 70% Ingrediente: mas\u0103 de cacao, zah\u0103r, unt de cacao, emulsifiant: lecitine din soia; extract din vanilie. Cu ingrediente din t\u0103ri UE \u015fi non UE. Poate contine urme de fructe cu coaj\u0103 lemnoas\u0103 \u015fi lapte. A se consuma de preferint\u0103 \u00eenainte de/Nr. Lot: vezi spate ambalaj. A se p\u0103stra la loc uscat \u015fi r\u0103coros, ferit de razele soarelui \u0219i de \u00eenghet, at\u00e2t \u00eenainte, c\u00e2t \u015fi dup\u0103 deschidere. A se consuma \u00een cel mai scurt timp dup\u0103 deschidere. Fairtrade Cocoa Program (Programul Fairtrade de Cacao) permite micilor agricultori s\u0103 beneficieze de v\u00e2nzarea propriei cacao ca Fairtrade. Vizita\u021bi www.info.fairtrade.net/program. Produs in U.E. pentru S.C. Lidl Discount SRL, Sat Nedelea, Comuna Arice\u015ftii Rahtivani, DN 72, Cr\u00e2ngul lui Bot, KM 73+810, jude\u021bul Prahova, Rom\u00e2nia. \r\n\r\nBG \u041d\u0430\u0442\u0443\u0440\u0430\u043b\u0435\u043d \u0448\u043e\u043a\u043e\u043b\u0430\u0434. \u0421\u044a\u0434\u044a\u0440\u0436\u0430 \u043c\u0438\u043d. 70% \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430. \u0421\u044a\u0441\u0442\u0430\u0432\u043a\u0438: \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430, \u0437\u0430\u0445\u0430\u0440, \u043a\u0430\u043a\u0430\u043e\u0432\u043e \u043c\u0430\u0441\u043b\u043e, \u0435\u043c\u0443\u043b\u0433\u0430\u0442\u043e\u0440: \u043b\u0435\u0446\u0438\u0442\u0438\u043d (\u0441\u043e\u0435\u0432); \u0435\u043a\u0441\u0442\u0440\u0430\u043a\u0442 \u043e\u0442 \u0432\u0430\u043d\u0438\u043b\u0438\u044f. 
\u041c\u043e\u0436\u0435 \u0434\u0430 \u0441\u044a\u0434\u044a\u0440\u0436\u0430 \u0441\u043b\u0435\u0434\u0438 \u043e\u0442 \u044f\u0434\u043a\u0438 \u0438 \u043c\u043b\u044f\u043a\u043e. \u041d\u0435\u043e\u0442\u0432\u043e\u0440\u0435\u043d \u043d\u0430\u0439-\u0434\u043e\u0431\u044a\u0440 \u0434\u043e:/ \u041f\u0430\u0440\u0442\u0438\u0434\u0430: \u0432\u0438\u0436 \u0437\u0430\u0434\u043d\u0430\u0442\u0430 \u0441\u0442\u0440\u0430\u043d\u0430. \u0414\u0430 \u0441\u0435 \u0441\u044a\u0445\u0440\u0430\u043d\u044f\u0432\u0430 \u043d\u0430 \u0441\u0443\u0445\u043e \u0438 \u0445\u043b\u0430\u0434\u043d\u043e \u043c\u044f\u0441\u0442\u043e. \u041f\u0440\u043e\u0433\u0440\u0430\u043c\u0430\u0442\u0430 \u0437\u0430 \u0441\u0435\u0440\u0442\u0438\u0444\u0438\u0446\u0438\u0440\u0430\u043d\u0435 \u043d\u0430 \u043a\u0430\u043a\u0430\u043e Fairtrade \u0421\u043e\u0441\u043e\u0430 Program \u0434\u0430\u0432\u0430 \u0432\u044a\u0437\u043c\u043e\u0436\u043d\u043e\u0441\u0442 \u043d\u0430 \u043c\u0430\u043b\u043a\u0438\u0442\u0435 \u043f\u0440\u043e\u0438\u0437\u0432\u043e\u0434\u0438\u0442\u0435\u043b\u0438 \u0434\u0430 \u043f\u0440\u043e\u0434\u0430\u0432\u0430\u0442 \u043f\u043e\u0432\u0435\u0447\u0435 \u043a\u0430\u043a\u0430\u043e \u043f\u0440\u0438 \u0441\u043f\u0440\u0430\u0432\u0435\u0434\u043b\u0438\u0432\u0438 \u0443\u0441\u043b\u043e\u0432\u0438\u044f \u043d\u0430 \u0442\u044a\u0440\u0433\u043e\u0432\u0438\u044f. \u041f\u043e\u0432\u0435\u0447\u0435 \u0438\u043d\u0444\u043e\u0440\u043c\u0430\u0446\u0438\u044f \u043d\u0430 www.info.fairtrade.net/program \u041f\u0440\u043e\u0438\u0437\u0432\u0435\u0434\u0435\u043d\u043e \u0432 \u0413\u0435\u0440\u043c\u0430\u043d\u0438\u044f \u0437\u0430 \u041b\u0438\u0434\u043b \u0429\u0438\u0444\u0442\u0443\u043d\u0433 \u0435\u043d\u0434 \u041a\u043e. 
\u041a\u0413, \u0429\u0438\u0444\u0442\u0441\u0431\u0435\u0440\u0433\u0449\u0440\u0430\u0441\u0435 1, 74167 \u041d\u0435\u043a\u0430\u0440\u0437\u0443\u043b\u043c, \u0413\u0435\u0440\u043c\u0430\u043d\u0438\u044f. LIDL",1],["Cukor, p\u00e1lmaolaj, _MOGYOR\u00d3_ (13%), zs\u00edrszeg\u00e9ny kaka\u00f3por (7,4%), sov\u00e1ny _TEJPOR_ (6,6%), _TEJSAV\u00d3POR_, emulge\u00e1l\u00f3szer: lecitinek (_SZ\u00d3JA_); aroma (vanillin).",1],["",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":4,"null_rate":0.92,"stats":{"cardinality":4,"entropy":2.0,"entropy_ratio":1.0,"top_rate":0.25,"top_value":"Kaka\u00f3massza, cukor, kaka\u00f3 - vaj, van\u00edlia."}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"ingredients_text_sr","extras":{"singletons":2,"top_values":[["\u0160e\u0107er, kakao masa, kakao buter, vanile.",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"\u0160e\u0107er, kakao masa, kakao buter, vanile."}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_sr","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_nl_ocr_1675675383","extras":{"singletons":1,"top_values":[["Cacaomassa, suiker, cacaoboter, natuurlijk Bourbon vanille- 
stokje.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Cacaomassa, suiker, cacaoboter, natuurlijk Bourbon vanille- stokje."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_cs","extras":{"singletons":1,"top_values":[["Kakaov\u00e1 hmota, cukr, kakaov\u00e9 m\u00e1slo, vanilka.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Kakaov\u00e1 hmota, cukr, kakaov\u00e9 m\u00e1slo, vanilka."}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"generic_name_sr","extras":{"singletons":2,"top_values":[["Tamna \u010dokolada sa 70% kakaa",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"Tamna \u010dokolada sa 70% kakaa"}},{"alerts":[{"code":"null_rate","level":"warn","message":"94.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_cs","extras":{"singletons":0,"top_values":[["",3]]},"kind":"categorical","n":50,"n_null":47,"n_unique":1,"null_rate":0.94,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"product_name_sr","extras":{"singletons":2,"top_values":[["Excellence 70% Cocoa Intense Dark",1],["\u0422\u0435\u0447\u0435\u043d \u0428\u043e\u043a\u043e\u043b\u0430\u0434 
\u041d\u0443\u0442\u0435\u043b\u0430",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"Excellence 70% Cocoa Intense Dark"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_hu_ocr_1571428260_result","extras":{"singletons":1,"top_values":[["kaka\u00f3massza, cukor, kaka\u00f3 - vaj, term\u00e9szetes bourbon van\u00edlia. Nyomokban egy\u00e9b di\u00f3f\u00e9l\u00e9ket, tejet, sz\u00f3j\u00e1t, szez\u00e1mmagot es b\u00faz\u00e1t tartalmazhat.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"kaka\u00f3massza, cukor, kaka\u00f3 - vaj, term\u00e9szetes bourbon van\u00edlia. Nyomokban egy\u00e9b di\u00f3f\u00e9l\u00e9ket, tejet, sz\u00f3j\u00e1t, szez\u00e1mmagot es b\u00faz\u00e1t tartalmazhat."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_hu_ocr_1571428260","extras":{"singletons":1,"top_values":[["kaka\u00f3massza, cukor, kaka\u00f3- vaj, term\u00e9szetes bourbon van\u00edlia. Nyomokban egy\u00e9b di\u00f3f\u00e9l\u00e9ket, tejet, sz\u00f3j\u00e1t, szez\u00e1mmagot es b\u00faz\u00e1t tartalmazhat.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"kaka\u00f3massza, cukor, kaka\u00f3- vaj, term\u00e9szetes bourbon van\u00edlia. 
Nyomokban egy\u00e9b di\u00f3f\u00e9l\u00e9ket, tejet, sz\u00f3j\u00e1t, szez\u00e1mmagot es b\u00faz\u00e1t tartalmazhat."}},{"alerts":[{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"generic_name_hu","extras":{"singletons":1,"top_values":[["",3],["Finom",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":2,"null_rate":0.92,"stats":{"cardinality":2,"entropy":0.8112781244591328,"entropy_ratio":0.8112781244591328,"top_rate":0.75,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"92.0% null"}],"column":"product_name_hu","extras":{"singletons":2,"top_values":[["",2],["Excellence 70% Cocoa Intense Dark",1],["Dark Chocolate 70% Cacao",1]]},"kind":"categorical","n":50,"n_null":46,"n_unique":3,"null_rate":0.92,"stats":{"cardinality":3,"entropy":1.5,"entropy_ratio":0.9463946303571862,"top_rate":0.5,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"ingredients_text_with_allergens_sr","extras":{"singletons":2,"top_values":[["\u0160e\u0107er, kakao masa, kakao buter, vanile.",1],["",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"\u0160e\u0107er, kakao masa, kakao buter, vanile."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_es_ocr_1548767061_result","extras":{"singletons":1,"top_values":[["Pasta de cacao, az\u00facar, manteca de cacao, emulgente: lecitina de girasol (E-322), extracto de vainilla. 
Cacao: 70% m\u00ednimo.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Pasta de cacao, az\u00facar, manteca de cacao, emulgente: lecitina de girasol (E-322), extracto de vainilla. Cacao: 70% m\u00ednimo."}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_xx","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_xx","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_es_ocr_1548767061","extras":{"singletons":1,"top_values":[["Pasta de cacao, az\u00facar, manteca de cacao, emulgente: lecitina de girasol (E-322), extracto de vainilla. Cacao: 70% m\u00ednimo.  ",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Pasta de cacao, az\u00facar, manteca de cacao, emulgente: lecitina de girasol (E-322), extracto de vainilla. Cacao: 70% m\u00ednimo.  
"}},{"alerts":[{"code":"null_rate","level":"warn","message":"96.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_xx","extras":{"singletons":0,"top_values":[["",2]]},"kind":"categorical","n":50,"n_null":48,"n_unique":1,"null_rate":0.96,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_xx","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_xx","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_ur","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"product_name_ur","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_he","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"2 singleton categories"},{"code":"null_rate","level":"warn","message":"96.0% null"}],"column":"product_name_he","extras":{"singletons":2,"top_values":[["\u05e0\u05d5\u05d8\u05dc\u05d4",1],["\u05ea\u05e4\u05d5\u05e6\u05d9\u05e4\u05e1 \u05e9\u05de\u05e0\u05ea \u05d1\u05e6\u05dc",1]]},"kind":"categorical","n":50,"n_null":48,"n_unique":2,"null_rate":0.96,"stats":{"cardinality":2,"entropy":1.0,"entropy_ratio":1.0,"top_rate":0.5,"top_value":"\u05e0\u05d5\u05d8\u05dc\u05d4"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_ur","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"generic_name_ur","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_he","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_he","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_ur","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_he","extras":{"singletons":1,"top_values":[["\u05de\u05de\u05e8\u05d7 \u05d0\u05d2\u05d5\u05d6\u05d9 \u05dc\u05d5\u05d6 \u05e2\u05dd 
\u05e7\u05e7\u05d0\u05d5",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"\u05de\u05de\u05e8\u05d7 \u05d0\u05d2\u05d5\u05d6\u05d9 \u05dc\u05d5\u05d6 \u05e2\u05dd \u05e7\u05e7\u05d0\u05d5"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_he","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"nutriscore_grade_producer","extras":{"singletons":3,"top_values":[["c",1],["e",1],["b",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"c"}},{"alerts":[{"code":"long_tail","level":"info","message":"3 singleton categories"},{"code":"null_rate","level":"warn","message":"94.0% null"}],"column":"nutriscore_grade_producer_imported","extras":{"singletons":3,"top_values":[["c",1],["e",1],["b",1]]},"kind":"categorical","n":50,"n_null":47,"n_unique":3,"null_rate":0.94,"stats":{"cardinality":3,"entropy":1.584962500721156,"entropy_ratio":1.0,"top_rate":0.3333333333333333,"top_value":"c"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"packaging_text_el","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_el","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_el","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_el","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_el","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_el","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"generic_name_th","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1559410715_result","extras":{"singletons":1,"top_values":[["Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% 
null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_th","extras":{"singletons":1,"top_values":[["Cocoa solids 99%, Cocoa paste, fat-reduced cocoa, cocoa butter, demerara sugar. May contain nuts, milk and soya.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Cocoa solids 99%, Cocoa paste, fat-reduced cocoa, cocoa butter, demerara sugar. May contain nuts, milk and soya."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_th","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_th","extras":{"singletons":1,"top_values":[["\u0e25\u0e34\u0e19\u0e14\u0e4c \u0e40\u0e2d\u0e47\u0e01\u0e40\u0e0b\u0e2d\u0e23\u0e4c\u0e41\u0e25\u0e19\u0e0b\u0e4c \u0e14\u0e32\u0e23\u0e4c\u0e01 99% \u0e42\u0e01\u0e42\u0e01\u0e49 \u0e14\u0e32\u0e23\u0e4c\u0e01 \u0e41\u0e2d\u0e1b\u0e42\u0e0b\u0e25\u0e39\u0e17 \u0e0a\u0e47\u0e2d\u0e01\u0e42\u0e01\u0e41\u0e25\u0e15",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"\u0e25\u0e34\u0e19\u0e14\u0e4c \u0e40\u0e2d\u0e47\u0e01\u0e40\u0e0b\u0e2d\u0e23\u0e4c\u0e41\u0e25\u0e19\u0e0b\u0e4c \u0e14\u0e32\u0e23\u0e4c\u0e01 99% \u0e42\u0e01\u0e42\u0e01\u0e49 
\u0e14\u0e32\u0e23\u0e4c\u0e01 \u0e41\u0e2d\u0e1b\u0e42\u0e0b\u0e25\u0e39\u0e17 \u0e0a\u0e47\u0e2d\u0e01\u0e42\u0e01\u0e41\u0e25\u0e15"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1548767354_result","extras":{"singletons":1,"top_values":[["Extra feine dunkle Schokolade.\r\nSchokolade enth\u00e4lt: Kakao: mind. 99%.\r\nZutaten: Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Extra feine dunkle Schokolade.\r\nSchokolade enth\u00e4lt: Kakao: mind. 99%.\r\nZutaten: Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_th","extras":{"singletons":1,"top_values":[["Cocoa solids 99%, Cocoa paste, fat-reduced cocoa, cocoa butter, demerara sugar. May contain nuts, milk and soya.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Cocoa solids 99%, Cocoa paste, fat-reduced cocoa, cocoa butter, demerara sugar. 
May contain nuts, milk and soya."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"origin_th","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1548767354","extras":{"singletons":1,"top_values":[["Extra feine dunkle Schokolade.\r\nSchokolade enth\u00e4lt: Kakao: mind. 99%.\r\nZutaten: Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten.\r\n",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Extra feine dunkle Schokolade.\r\nSchokolade enth\u00e4lt: Kakao: mind. 99%.\r\nZutaten: Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten.\r\n"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_de_ocr_1559410715","extras":{"singletons":1,"top_values":[["Extra feine dunkle Schokolade.\r\nSchokolade enth\u00e4lt: Kakao: mind. 
99%.\r\nZutaten: Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Extra feine dunkle Schokolade.\r\nSchokolade enth\u00e4lt: Kakao: mind. 99%.\r\nZutaten: Kakaomasse, fettarmes Kakaopulver, Kakaobutter, Rohrzucker.\r\nKann Schalenfr\u00fcchte, Milch und Soja enthalten."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_it_ocr_1559410715","extras":{"singletons":1,"top_values":[["Cioccolato amaro extra.\r\nCacao: 99% minimo.\r\nIngredienti: pasta di cacao, cacao magro, burro di cacao, zucchero grezzo di canna.\r\nPu\u00f2 contenere frutta a guscio, latte e soia.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Cioccolato amaro extra.\r\nCacao: 99% minimo.\r\nIngredienti: pasta di cacao, cacao magro, burro di cacao, zucchero grezzo di canna.\r\nPu\u00f2 contenere frutta a guscio, latte e soia."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_it_ocr_1559410715_result","extras":{"singletons":1,"top_values":[["pasta di cacao, cacao magro, burro di cacao, zucchero grezzo di canna.\r\nPu\u00f2 contenere frutta a guscio, latte e soia.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"pasta di cacao, cacao magro, burro di cacao, 
zucchero grezzo di canna.\r\nPu\u00f2 contenere frutta a guscio, latte e soia."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_fr_imported","extras":{"singletons":1,"top_values":[["1 FEUILLE PAPIER \u00c0 RECYCLER, 1 FEUILLE METAL \u00c0 RECYCLER.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"1 FEUILLE PAPIER \u00c0 RECYCLER, 1 FEUILLE METAL \u00c0 RECYCLER."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"preparation_fr_imported","extras":{"singletons":1,"top_values":[["Produit pr\u00eat \u00e0 consommer",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Produit pr\u00eat \u00e0 consommer"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"preparation","extras":{"singletons":1,"top_values":[["Produit pr\u00eat \u00e0 consommer",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Produit pr\u00eat \u00e0 consommer"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"preparation_fr","extras":{"singletons":1,"top_values":[["Produit pr\u00eat \u00e0 consommer",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Produit pr\u00eat \u00e0 consommer"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_lc","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_lc","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_lc","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"generic_name_lc","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"ingredients_text_xx_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"product_name_xx_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"skipped","level":"info","message":"no profiler for kind=unknown"}],"column":"generic_name_xx_debug_tags","extras":{},"kind":"unknown","n":50,"n_null":0,"n_unique":null,"null_rate":0.0,"stats":{}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1561814324","extras":{"singletons":1,"top_values":[["25 % cerneaux de noix, 25 % amandes d\u00e9cortiqu\u00e9es 25 % raisins secs sultanines (raisins secs,huile de tournesol. antioxydant: anhydride lfureux), 15% canneberges, 9,8% sucre, huile de tournesol. Traces \u00e9ventuelles d'autres fruits \u00e0 coque et d'arachides. Conditionn\u00e9 sous atmosph\u00e8re protectrice.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"25 % cerneaux de noix, 25 % amandes d\u00e9cortiqu\u00e9es 25 % raisins secs sultanines (raisins secs,huile de tournesol. antioxydant: anhydride lfureux), 15% canneberges, 9,8% sucre, huile de tournesol. Traces \u00e9ventuelles d'autres fruits \u00e0 coque et d'arachides. 
Conditionn\u00e9 sous atmosph\u00e8re protectrice."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1561814324_result","extras":{"singletons":1,"top_values":[["25 % cerneaux de noix, 25 % amandes d\u00e9cortiqu\u00e9es 25 % raisins secs sultanines (raisins secs,huile de tournesol. antioxydant: anhydride lfureux), 15% canneberges, 9,8% sucre, huile de tournesol. Traces \u00e9ventuelles d'autres fruits \u00e0 coque et d'arachides.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"25 % cerneaux de noix, 25 % amandes d\u00e9cortiqu\u00e9es 25 % raisins secs sultanines (raisins secs,huile de tournesol. antioxydant: anhydride lfureux), 15% canneberges, 9,8% sucre, huile de tournesol. 
Traces \u00e9ventuelles d'autres fruits \u00e0 coque et d'arachides."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1624039072_result","extras":{"singletons":1,"top_values":[["Cacao, \u00e9mulsifiant (l\u00e9cithine de _soja_), vanille.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Cacao, \u00e9mulsifiant (l\u00e9cithine de _soja_), vanille."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1624039072","extras":{"singletons":1,"top_values":[["ingr\u00e9dients : cacao, \u00e9mulsifiant (l\u00e9cithine de _soja_), vanille.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"ingr\u00e9dients : cacao, \u00e9mulsifiant (l\u00e9cithine de _soja_), vanille."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573108346","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides 
d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1566920858_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , oeufs entiers frais, cr\u00e8me fra\u00eeche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - lactylate de sodium, Esters et mono et diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides gras), prot\u00e9ines de lait, levure d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , oeufs entiers frais, cr\u00e8me fra\u00eeche 5,5% , levure, sel, 
ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - lactylate de sodium, Esters et mono et diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides gras), prot\u00e9ines de lait, levure d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573107556","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573108346_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573107560_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573108349_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573108360","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573109955_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573108349","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573109955","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573107556_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573108360_result","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2 - actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1573107560","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. Esters et mono gras), prot\u00e9ines de lait levure",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , aeufs entiers frais, cr\u00e8me fraiche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- actylate de sodium, diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque. 
Esters et mono gras), prot\u00e9ines de lait levure"}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1566920858","extras":{"singletons":1,"top_values":[["Farine de bl\u00e9, sucre, beurre frais 9,5 % , oeufs entiers frais, cr\u00e8me fra\u00eeche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- lactylate de sodium, Esters et mono et diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides gras), prot\u00e9ines de lait, levure d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Farine de bl\u00e9, sucre, beurre frais 9,5 % , oeufs entiers frais, cr\u00e8me fra\u00eeche 5,5% , levure, sel, ar\u00f4mes naturels (contient alcool), gluten de bl\u00e9, poudre de lait \u00e9cr\u00e9m\u00e9, eau de vie, \u00e9mulsifiants (Mono et diglyc\u00e9rides d'acides gras, St\u00e9aroyl-2- lactylate de sodium, Esters et mono et diac\u00e9tyltartriques des mono et diglyc\u00e9rides d'acides gras), prot\u00e9ines de lait, levure d\u00e9sactiv\u00e9e, colorant (b\u00e9ta carot\u00e8ne) Traces \u00e9ventuelles de fruits \u00e0 coque."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"generic_name_lt","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_ro","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"packaging_text_lt","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_lt","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of 
rows"}],"column":"origin_lt","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"product_name_lt","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_with_allergens_lt","extras":{"singletons":1,"top_values":[["",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":""}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1713713129","extras":{"singletons":1,"top_values":[["Ingr\u00e9dients : P\u00e2te de cacao, cacao en poudre d\u00e9graiss\u00e9, beurre de cacao, sucre, lait en poudre, p\u00e2te de amandes et de noisettes, \u00e9mulsifiants (l\u00e9cithines (soja, toumesol)) et ar\u00f4me. Cacao 92% minimum. 
Peut contenir des traces d'autres fruits \u00e0 coque.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"Ingr\u00e9dients : P\u00e2te de cacao, cacao en poudre d\u00e9graiss\u00e9, beurre de cacao, sucre, lait en poudre, p\u00e2te de amandes et de noisettes, \u00e9mulsifiants (l\u00e9cithines (soja, toumesol)) et ar\u00f4me. Cacao 92% minimum. Peut contenir des traces d'autres fruits \u00e0 coque."}},{"alerts":[{"code":"long_tail","level":"info","message":"1 singleton categories"},{"code":"null_rate","level":"warn","message":"98.0% null"},{"code":"imbalance","level":"warn","message":"top value is 100.0% of rows"}],"column":"ingredients_text_fr_ocr_1713713129_result","extras":{"singletons":1,"top_values":[["P\u00e2te de cacao, cacao en poudre d\u00e9graiss\u00e9, beurre de cacao, sucre, lait en poudre, p\u00e2te de amandes et de noisettes, \u00e9mulsifiants (l\u00e9cithines (soja, toumesol)) et ar\u00f4me. Cacao 92% minimum. Peut contenir des traces d'autres fruits \u00e0 coque.",1]]},"kind":"categorical","n":50,"n_null":49,"n_unique":1,"null_rate":0.98,"stats":{"cardinality":1,"entropy":-0.0,"entropy_ratio":0.0,"top_rate":1.0,"top_value":"P\u00e2te de cacao, cacao en poudre d\u00e9graiss\u00e9, beurre de cacao, sucre, lait en poudre, p\u00e2te de amandes et de noisettes, \u00e9mulsifiants (l\u00e9cithines (soja, toumesol)) et ar\u00f4me. Cacao 92% minimum. 
Peut contenir des traces d'autres fruits \u00e0 coque."}}],"insights":{"errors":[],"insights":[{"confidence":"high","critiques":[],"evidence_keys":["column_count","row_count","nutriscore_grade","nova_groups","ecoscore_grade","food_groups","pnns_groups_2","lang","countries_lc","ecoscore_score","nutriscore_score","completeness"],"featured_charts":[{"caption":"Check how heavily the sample skews to Nutri-Score 'e' (27 of 50) versus a/b/c.","column":"nutriscore_grade","kind":"bar"},{"caption":"See the split between ultra-processed (NOVA 4) and processed (NOVA 3) products, which dominate the sample.","column":"nova_groups","kind":"donut"},{"caption":"Compare Eco-Score grade frequencies including the notable 'unknown' and 'not-applicable' buckets.","column":"ecoscore_grade","kind":"bar"},{"caption":"Confirm that biscuits/cakes and chocolate products together account for most of the sample's food categories.","column":"pnns_groups_2","kind":"bar"},{"caption":"Spot the strong French-language bias (35/50) that will affect any text-based analysis.","column":"lang","kind":"donut"}],"model":"anthropic:claude-opus-4-7","narrative":"This is a 50-row sample from Open Food Facts with 545 columns, dominated by per-language localized fields (product names, generic names, ingredient texts, packaging texts, origin) plus nutrition, scoring, and provenance metadata. The shape is extremely sparse: the vast majority of localized columns have null rates of 0.92\u20130.98, so most analytical signal lives in a small core of fields. Worth a closer look first: the Nutri-Score and NOVA distributions (the catalog skews heavily to grade 'e' and NOVA group 4), the Eco-Score grade mix, and the food_groups / pnns_groups_2 breakdown showing this sample is concentrated in chocolate and biscuit products. Also note the heavy imbalance in `lang` (70% French) and `countries_lc`, which biases any text or origin analysis. 
Treat the hundreds of `*_xx` / `ingredients_text_<lang>` columns as effectively empty rather than as features.","scope":"dataset","target":"__global__"},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical update_key field with only 9 distinct values across 50 rows, dominated by 'brands' at 56% (28/50) and 'sort' at 20%. The long tail mixes human-readable labels ('divinfood', 'nova-yogurts', 'germany2', 'france') with timestamp-style tokens ('key_1748337248', 'ingredients20240805'), suggesting inconsistent naming conventions for what appears to track update batches or jobs. Entropy ratio of 0.64 confirms the heavy concentration on a few keys.","role":"metadata","scope":"column","target":"update_key","treatment":"Group rare keys into 'other' or normalize naming before using as a grouping dimension."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Hierarchical product category strings (Open Food Facts style taxonomy paths), stored as comma-separated breadcrumbs. Near-unique with 45 distinct values across 50 rows and entropy ratio 0.99, and the strings appear in mixed languages (French, English, Polish, Bulgarian Cyrillic), so direct grouping will fragment. 
Top value covers only 4% of rows and one row is null.","role":"feature","scope":"column","target":"categories_old","treatment":"Split on commas, normalise language, and keep only the top-level taxon as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.iqr","stats.skew","stats.kurtosis","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric Eco-Score rating per item, ranging from 13 to 94 with a mean of 47.7 and median of 44. The distribution is mildly right-skewed (0.31) and platykurtic (-0.79), spanning a wide IQR of 36.5 with no outliers flagged. Notably, 14% of values are null and only 31 unique scores appear across 50 rows.","role":"feature","scope":"column","target":"ecoscore_score","treatment":"Impute or flag the 14% nulls, then use as a continuous feature without transformation."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a categorical flag for environmental impact severity, but it carries no usable signal in this sample. 56% of the 50 rows are null, and the remaining 22 records all hold the empty string, leaving cardinality at 1 and entropy at 0.","role":"feature","scope":"column","target":"environment_impact_level","treatment":"Drop; the column is effectively constant and majority-null."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Finnish-language ingredient declarations, almost entirely absent: 90% of the 50 rows are null and only 4 distinct non-null values appear, two of which are empty strings. 
The few populated entries are verbose product ingredient lists (chocolate, wheat-based baked goods) with allergen markup, suggesting this is a localized free-text field rather than a categorical feature despite its low cardinality here.","role":"free_text","scope":"column","target":"ingredients_text_fi","treatment":"Drop or set aside; null_rate 0.9 makes it unusable as a feature without a Finnish-text NLP pipeline."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a flag indicating whether nutrition data was prepared, but it carries no information: only one unique value (an empty string) appears across all 48 non-null rows, with a 4% null rate. Entropy is 0 and top_rate is 1.0, so the column is constant.","role":"metadata","scope":"column","target":"nutrition_data_prepared","treatment":"Drop; constant column with no signal."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column, packaging_shapes_tags, was skipped by the profiler so no descriptive statistics are available beyond a row count of 50 and a null rate of 0. The name suggests a tag-style field listing packaging shape descriptors, likely multi-valued per row, which is probably why it was bypassed. Without unique counts or value samples, nothing further can be confirmed.","role":"free_text","scope":"column","target":"packaging_shapes_tags","treatment":"Re-profile after splitting the tag list, then one-hot or multi-label encode."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'nutrient_levels_tags' was skipped by the profiler, so no statistics beyond a 50-row count and 0% null rate are available. 
The name suggests a list of nutrient classification tags (likely multi-valued strings like 'fat-in-low-quantity'), but uniqueness, cardinality, and value distribution are all unknown. Treat any downstream use cautiously until the column is re-profiled with list-aware parsing.","role":"feature","scope":"column","target":"nutrient_levels_tags","treatment":"Re-profile with list/tag-aware parsing, then one-hot or multi-label encode the individual tags."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column packagings_materials was skipped by the profiler, so its kind is unknown and no descriptive statistics are available. We only know there are 50 rows and a 0.0 null rate; uniqueness, type, and value distribution are all missing. The name suggests structured packaging material data (likely nested or list-valued), which would explain why the profiler bailed out.","role":"other","scope":"column","target":"packagings_materials","treatment":"Inspect raw values manually and parse the nested structure before any downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["column","kind","n","null_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named `ingredients_without_ecobalyse_ids`, suggesting it lists ingredients that lack matching identifiers in the Ecobalyse reference system. 
Saturn skipped profiling, so type, uniqueness, and value distribution are unknown despite a populated null_rate of 0.0 across 50 rows.","role":"other","scope":"column","target":"ingredients_without_ecobalyse_ids","treatment":"Inspect raw values manually to determine structure (likely a list) before deciding on parsing or join strategy."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Dutch-language generic product name field, likely from a food product catalog. It is largely unusable as-is: 76% of rows are null and among the 12 non-null entries, 9 are empty strings, leaving only 3 distinct real values (e.g., 'Extra fijne pure chocolade'). Cardinality is just 4 across 50 rows, so there is essentially no signal here.","role":"metadata","scope":"column","target":"generic_name_nl","treatment":"Drop, or retain only as a descriptive label \u2014 too sparse to model."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'misc_tags' was skipped by the profiler, so no type inference, uniqueness count, or value statistics are available. The only confirmed signals are 50 rows with a 0.0 null rate. Without further stats, its content and structure cannot be characterized.","role":"other","scope":"column","target":"misc_tags","treatment":"Re-profile with a parser suited to this column (e.g., list/JSON tags) before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Swedish-localised product name field, populated for only 4 of 50 rows (null_rate 0.92). The 4 present values are all unique, giving maximum entropy (entropy_ratio 1.0) but no repeated category to learn from. 
Values like \"90% Cocoa\" and \"Dark 70%\" look English rather than Swedish, suggesting localisation is incomplete or mislabelled.","role":"metadata","scope":"column","target":"product_name_sv","treatment":"Drop or defer until localisation coverage improves; not usable as a feature at 92% null."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.mean","stats.median","stats.min","stats.max","stats.q1","stats.q3","stats.iqr","stats.std","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"A numeric count of scans per record, with 49 unique values across 50 rows and no nulls or zeros. The distribution is tightly clustered (median 492, IQR 217) but extremely right-skewed (skew 3.90, kurtosis 18.72) with a max of 2523 versus a Q3 of 604, producing 4 outliers (8%). The mean (577.94) sits well above the median, confirming a heavy upper tail.","role":"feature","scope":"column","target":"scans_n","treatment":"Log-transform or winsorize before modelling to tame the heavy right tail."},{"confidence":"high","critiques":[],"evidence_keys":["alerts","n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.std","stats.iqr"],"model":"anthropic:claude-opus-4-7","narrative":"Constant numeric column holding the value 996.0 across all 50 rows with no nulls. Despite being typed as numeric, the zero variance (std 0.0, iqr 0.0) and single unique value indicate this is a schema/version tag rather than a measurement. 
Carries no signal for modelling.","role":"metadata","scope":"column","target":"schema_version","treatment":"Drop before modelling; retain only as a provenance tag."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Open Food Facts product URLs, one per row, with every value unique across all 50 rows (cardinality 50, entropy_ratio 1.0). The URL path embeds a product barcode plus a slugified name, so it functions as a permalink/identifier rather than a feature. No nulls, but the long_tail alert simply reflects that every row is its own category.","role":"identifier","scope":"column","target":"url","treatment":"Drop from modelling; keep as a join key or reference link to the source product page."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column `vitamins_tags` was skipped by the profiler, so no type, uniqueness, or distribution statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests a list-valued field enumerating vitamin identifiers (e.g., tag-style strings), but this cannot be confirmed from the evidence. Without parsing, downstream use is blocked.","role":"other","scope":"column","target":"vitamins_tags","treatment":"Re-profile after parsing as a list of tags, then one-hot or multi-hot encode."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler (alert: \"skipped\"), so its kind is unknown and no statistics were computed beyond a row count of 50 with 0% nulls. The name suggests a debug artefact holding sorted language codes, likely a list or compound value the profiler couldn't classify. 
Without unique counts or value samples there is nothing further to infer.","role":"metadata","scope":"column","target":"debug_param_sorted_langs","treatment":"Drop unless you can re-profile with list/struct support; it appears to be a debug field."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-form packaging descriptions, likely from a food/product database (Open Food Facts style) given multilingual prefixes like 'en:', 'es:', 'pt:'. Cardinality is extreme: 41 unique values across 50 rows with entropy ratio 0.985, and the top value 'Plastique' covers only 9% \u2014 most entries are comma-separated multi-tag strings mixing languages. 12% are null, and the long_tail alert confirms there is no usable category structure as-is.","role":"free_text","scope":"column","target":"packaging","treatment":"Split on commas, normalize language prefixes, and one-hot encode the resulting material tags rather than using the raw string."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column is named \"grades\" and contains 50 rows with no nulls, but saturn skipped profiling and could not infer a kind, so no distributional stats are available. Without n_unique or value summaries, it's impossible to tell whether this holds letter grades, numeric scores, or a nested structure. 
The \"skipped\" alert is the key signal: something about the storage type prevented standard analysis.","role":"other","scope":"column","target":"grades","treatment":"Manually inspect a sample to determine the underlying type before deciding on a downstream encoding."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","skew","n_outliers","outlier_rate","q1","q3","iqr","n_unique","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Values are Unix epoch seconds (min 1737907641, max 1768643720) so this column is a last-modified timestamp, covering late January 2025 through mid-January 2026. All 50 rows are unique with no nulls, but the distribution is heavily left-skewed (skew -1.96) with 6 outliers (12%) sitting far below the q1 of 1761612624, suggesting a small tail of much older edits while most records cluster within a ~6.1M second IQR. Treat as a timestamp, not a numeric feature.","role":"timestamp","scope":"column","target":"last_modified_t","treatment":"Convert from epoch seconds to datetime and derive recency or bucketed features instead of using the raw integer."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"origin_nl appears to be a categorical attribute (likely a Dutch-language origin label) but is effectively empty in this sample. 76% of the 50 rows are null, and the remaining 12 non-null entries are all the empty string, giving a cardinality of 1 and entropy of 0. 
There is no usable signal here.","role":"metadata","scope":"column","target":"origin_nl","treatment":"Drop; column has no variance and is mostly null."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Language code for the allergens text, with 6 distinct values across 50 rows and a 4% null rate. The distribution is nearly bimodal between 'en' (22) and 'fr' (21), with es/de/it/pl appearing once or twice each \u2014 a language mix worth flagging before any text processing.","role":"metadata","scope":"column","target":"allergens_lc","treatment":"Use as a language filter or routing key before tokenizing the allergens text."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'states_hierarchy' was skipped by the profiler, so its kind is unknown and no descriptive statistics were computed. We can only confirm there are 50 rows with no nulls; uniqueness, type, and value distribution are unavailable.","role":"other","scope":"column","target":"states_hierarchy","treatment":"Re-profile or inspect manually to determine type before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Japanese-language ingredients text, almost entirely absent from this sample. 
98% of the 50 rows are null, and the single non-null value is an empty string, leaving cardinality at 1 and entropy at 0.","role":"free_text","scope":"column","target":"ingredients_text_ja","treatment":"Drop; the column carries no usable signal in this sample."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `teams_tags` was skipped by the profiler, so its kind, uniqueness, and value distribution are unknown. Only two facts are available: 50 rows were seen and none were null. Without further stats, the content (e.g. whether it holds lists, delimited tags, or structured objects) cannot be characterised.","role":"other","scope":"column","target":"teams_tags","treatment":"Re-profile with a parser that handles this column's type before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to capture user-submitted allergen/ingredient traces, prefixed with a language code like '(en)' or '(fr)' followed by comma-separated tags such as 'en:milk,en:nuts'. With 35 unique values across 50 rows and entropy ratio 0.938, it is highly diverse; the top value '(en) ' (an empty tag list) covers only 14% and the distribution has a long tail. 
Notably, the language prefix is mixed (English and French) and many entries are blank tag lists, which complicates direct use as a category.","role":"free_text","scope":"column","target":"traces_from_user","treatment":"Parse the language prefix and split the tag list into a multi-hot allergen feature before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `origins_tags` was skipped by the profiler, so kind is unknown and no descriptive statistics were computed. The only confirmed signals are 50 rows present and a 0.0 null rate; uniqueness, value distribution, and data type are all unavailable.","role":"other","scope":"column","target":"origins_tags","treatment":"Re-profile with an appropriate parser (likely a list/tag field) before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the unit of measurement for serving quantity, almost exclusively grams ('g' at 45 of 46 non-null rows, top_rate 0.978) with a single 'ml' entry. With only 2 unique values, an 8% null rate, and entropy_ratio of 0.151, it carries almost no information.","role":"metadata","scope":"column","target":"serving_quantity_unit","treatment":"Drop or collapse to a binary flag; near-constant with negligible signal."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column \"vitamins_prev_tags\" was skipped by the profiler, so no type, uniqueness, or distribution stats are available. The only confirmed signals are 50 rows with a 0.0 null rate. 
Without further evidence the content (likely a list/array of prior tag values given the name) cannot be characterized.","role":"other","scope":"column","target":"vitamins_prev_tags","treatment":"Re-profile with a parser that handles nested/array values before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labelled ingredients_hierarchy but saturn skipped profiling it, so no type, uniqueness, or value statistics are available. The only confirmed signals are that it has 50 rows and zero nulls. Without further evidence, the structure (likely nested or list-valued, given the name) cannot be verified.","role":"other","scope":"column","target":"ingredients_hierarchy","treatment":"Re-profile with a parser that handles nested or list-valued fields before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.mean","stats.median","stats.min","stats.max","stats.q1","stats.q3","stats.iqr","stats.std","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric count of unique scans per row, with 48 distinct values across 50 records and no nulls or zeros. The distribution is heavily right-skewed (skew 3.91, kurtosis 18.71): median is 432 against a mean of 525.38, and the max of 2257 sits far beyond q3 of 560.75, producing 4 outliers (8% outlier rate). 
Std of 306.41 dwarfs the IQR of 198, confirming a long upper tail.","role":"feature","scope":"column","target":"unique_scans_n","treatment":"Log-transform or winsorize before modelling to tame the long upper tail."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-form labels/certifications column (e.g. organic, fair-trade, Triman, Green Dot) stored as comma-separated multi-label strings, often mixing English, French, Portuguese and Spanish tokens. Of 50 rows, 42 distinct values and entropy ratio 0.95 indicate near-unique combinations; the only repeated 'value' is the empty string (8 rows, 16%) on top of a 2% null rate, so roughly one in five records carries no label at all. The long_tail alert is well earned \u2014 almost every non-empty cell is its own bag of tags.","role":"feature","scope":"column","target":"labels","treatment":"Split on commas into a multi-hot tag set (normalising language variants) before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.top_rate","stats.top_value","stats.cardinality","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Likely an English-language generic product name field, but it is essentially empty: the top value is the blank string at 83.7% of non-null rows, with a further 14% null. Only 7 actual product descriptions appear across 50 rows (e.g. 'Dark chocolate', 'Crackers'), all singletons, giving cardinality 8 and entropy ratio 0.37. 
The long_tail alert reflects that every real value occurs exactly once.","role":"free_text","scope":"column","target":"generic_name_en","treatment":"Drop or treat blanks as missing; too sparse and unique to use as a categorical feature."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'weighters_tags' was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. Without kind detection or sample values, its content and structure cannot be characterised here. The name suggests it may hold tag-like annotations, but this is not confirmed by evidence.","role":"other","scope":"column","target":"weighters_tags","treatment":"Re-profile with parsing enabled to determine type and cardinality before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `popularity_tags` was skipped by the profiler, so its kind is unknown and no descriptive statistics were computed. The only signals available are that 50 rows were seen with a null rate of 0.0, meaning every row carries some value. Cardinality, type, and distribution are all missing, so the column's actual content cannot be characterized from this evidence.","role":"other","scope":"column","target":"popularity_tags","treatment":"Re-profile with the appropriate parser (likely list/JSON) before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a Finnish-localized product name field, but it is essentially empty: 90% nulls and the most frequent observed value is the empty string (top_rate 0.4 of the 5 non-null entries). 
Among the few populated rows, the names are in English (e.g., 'Excellence: 90% cocoa Dark Supreme', 'Arriba 85% Cacao Dark Chocolate'), contradicting the _fi suffix. With only 4 unique values across 50 rows, this column carries almost no usable signal.","role":"metadata","scope":"column","target":"product_name_fi","treatment":"Drop or defer until localization coverage improves; do not use as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language origin/provenance field describing where a product or its ingredients are made. The column is essentially empty: 40 of 50 rows hold the empty string and another 8% are null, leaving only 6 distinct non-blank descriptions ranging from a single country ('France') to multi-region ingredient breakdowns. Entropy ratio of 0.319 and a top_rate of 0.87 confirm the long-tail alert \u2014 almost no usable signal here.","role":"free_text","scope":"column","target":"origin_fr","treatment":"Drop or defer; too sparse and unstructured to use without targeted NER on the few populated strings."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text generic product names, predominantly French with some English entries (e.g., \"Compound Chocolate with MILK AND ALMONDS\"). The dominant value is the empty string at 21 of the 48 non-null rows (top_rate 0.4375), and combined with a 0.04 null_rate this means nearly half of all rows (23 of 50) carry no usable name. 
The remaining 28 unique values are nearly all singletons, producing the flagged long tail.","role":"free_text","scope":"column","target":"generic_name","treatment":"Treat empty strings as missing, then tokenize/normalize language before embedding or matching."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the Nutri-Score version applied to each row, and every one of the 50 records carries the value \"2023\". With cardinality 1 and entropy 0, it offers no discriminative signal in this sample.","role":"metadata","scope":"column","target":"nutriscore_version","treatment":"Drop, constant column."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column, named ingredients_without_ciqual_codes, was skipped by the profiler so no descriptive statistics are available beyond a row count of 50 and a null rate of 0. The name suggests it holds ingredient entries that lack a matching CIQUAL food-database code, likely as a list or nested structure that the profiler could not introspect. Without unique counts or value samples, nothing further can be inferred.","role":"other","scope":"column","target":"ingredients_without_ciqual_codes","treatment":"Re-profile after parsing the nested structure, or explode to a list before downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics beyond row count and null rate are available. The name suggests it holds tags for manufacturing locations, likely a multi-valued or list-like field that the dissector could not classify. 
With 50 rows and 0% nulls reported but no uniqueness or value stats, nothing further can be inferred from the evidence.","role":"metadata","scope":"column","target":"manufacturing_places_tags","treatment":"Re-profile after parsing the tag list, then one-hot or multi-label encode top tags."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `photographers_tags` was skipped by the profiler, so no kind, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds tag annotations associated with photographers, likely a list or delimited string, but this cannot be confirmed from the evidence. No further signal is present to characterise distribution, cardinality, or content.","role":"other","scope":"column","target":"photographers_tags","treatment":"Re-profile with list/string parsing enabled before deciding on downstream handling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Polish-language packaging text field that is effectively empty: 90% of the 50 rows are null and the remaining 10% are all the empty string, giving a single observed value and zero entropy. There is no usable signal here, only nulls and blanks.","role":"metadata","scope":"column","target":"packaging_text_pl","treatment":"Drop; the column carries no information."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `informers_tags` was skipped by the profiler, so no type, uniqueness, or value statistics were computed beyond a row count of 50 with 0% nulls. 
Without stats it's impossible to tell whether this holds scalar tags, delimited lists, or nested structures, though the plural name hints at a multi-valued tag field. Treat any interpretation as provisional until the column is re-profiled.","role":"other","scope":"column","target":"informers_tags","treatment":"Re-run profiling with parsing for list/JSON values before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"English-language ingredient lists for food products, stored as free-form text rather than a controlled vocabulary. With 36 unique values across 50 rows and entropy ratio 0.93, values are nearly all distinct; the only repeated 'value' is the empty string (9 occurrences, top_rate 0.20), and 12% are null, so roughly a third of rows carry no usable ingredient text. Content is heterogeneous \u2014 multi-sentence allergen-tagged lists, percentages, punctuation noise, and at least one junk entry ('Hhhhh').","role":"free_text","scope":"column","target":"ingredients_text_en","treatment":"Normalize, tokenize, and embed (or parse into ingredient lists) before modelling; treat empty strings as nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-form Italian ingredient lists for food products, with 68% nulls and only 50 rows total. Of the 16 non-null entries, 5 are empty strings (top_rate 0.3125) and the remaining values are nearly all unique long product descriptions, yielding 12 distinct values and entropy_ratio 0.913. 
Effectively unstructured text rather than a categorical field, despite being typed as such.","role":"free_text","scope":"column","target":"ingredients_text_it","treatment":"Treat as free text: normalize empty strings to null, then tokenize/parse for allergen or ingredient extraction rather than one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a German-origin flag or label, but it carries no information in this sample: 60% of rows are null and the remaining 20 rows all hold the empty string, giving a single unique value and zero entropy. There is no signal to model on here.","role":"feature","scope":"column","target":"origin_de","treatment":"Drop; constant column with majority nulls."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","stats.min","stats.max","stats.median","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"This is the NOVA food classification group (1-4 scale) indicating processing level, with 3 unique values present across 50 rows and a 4% null rate. The distribution is heavily skewed toward ultra-processed foods: median is 4.0, Q1-Q3 spans 3-4, and skew of -2.06 with kurtosis 5.65 confirms a long left tail with one outlier at the low end. 
Despite being numeric, only 3 of the 4 possible NOVA categories appear in this sample.","role":"feature","scope":"column","target":"nova_group","treatment":"Treat as ordinal categorical rather than continuous; impute the 4% nulls with median (4) or a missing-indicator."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Finnish-language packaging text field that is effectively empty in this sample. 90% of the 50 rows are null and the remaining 5 rows all hold the empty string, giving a single observed value and zero entropy.","role":"free_text","scope":"column","target":"packaging_text_fi","treatment":"Drop; column carries no information in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column packs an Open Food Facts-style product completion checklist into a single comma-joined string of `en:*-completed` / `en:*-to-be-completed` tags covering nutrition, ingredients, photos, packaging, etc. With 26 unique combinations across just 50 rows (entropy ratio 0.91) and the most common state appearing only 8 times, it behaves like a long-tail composite status flag rather than a clean category. 
The values are clearly multi-valued \u2014 they should be split into individual status tags before any modelling.","role":"feature","scope":"column","target":"states","treatment":"Split on comma and one-hot encode each `en:*` tag instead of treating the concatenated string as a single category."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.std","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a per-record sum of ingredient percentages where the precise share was not specified, expressed on a 0\u2013100 scale (max 100.0, min 0.4). The distribution is heavily left-skewed (skew -1.18) with a median of 100.0 and Q3 also at 100.0, meaning at least half of the 50 rows have effectively all of their ingredient mass unspecified. Only 22 unique values across 50 rows and a mean of 79.4 confirm the concentration at the upper bound.","role":"feature","scope":"column","target":"ingredients_with_unspecified_percent_sum","treatment":"Treat as a data-quality indicator; consider binarizing (e.g. =100 vs <100) rather than using the raw left-skewed value."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'added_countries_tags' was skipped by the profiler, so no type, uniqueness, or distributional statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds country tags associated with record additions, likely a list-like or multi-valued field that the profiler could not classify. 
Without further stats, nothing can be said about cardinality, format, or content.","role":"other","scope":"column","target":"added_countries_tags","treatment":"Inspect raw values manually and re-profile after parsing into a normalized list type."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column is a unique row identifier, with all 50 values distinct (n_unique=50, entropy_ratio=1.0) and no nulls. The values look like product barcodes (mostly 13-digit EAN/GTIN strings such as '6111242100992', with at least one shorter numeric like '20995553'), suggesting a product-level key rather than a sequential surrogate ID. The long_tail alert simply reflects that every value occurs exactly once (top_rate=0.02).","role":"identifier","scope":"column","target":"id","treatment":"Drop from modelling; retain as a join key for linking to product metadata."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'nutrient_levels' was skipped by the profiler, so its kind is unknown and no descriptive statistics are available. We only know it has 50 rows with a 0.0 null rate; uniqueness, distribution, and value structure are all missing from the evidence.","role":"other","scope":"column","target":"nutrient_levels","treatment":"Re-profile or manually inspect a sample to determine the underlying type before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","median","mean","skew","kurtosis","n_outliers","outlier_rate","iqr","null_rate","n_unique","n"],"model":"anthropic:claude-opus-4-7","narrative":"Values range from 1,567,543,172 to 1,610,897,644 with a median of 1,608,147,866 \u2014 consistent with Unix epoch seconds spanning roughly 2019 to early 2021, masquerading as a numeric sort key. 
Distribution is heavily left-skewed (skew -2.78, kurtosis 8.09) with 4 outliers (9.1%) trailing toward older timestamps, and 12% of rows are null. The tight IQR of ~6.16M seconds (~71 days) versus a 43M-second range confirms most records cluster late in the window.","role":"timestamp","scope":"column","target":"sortkey","treatment":"Convert from epoch seconds to datetime and use as a temporal feature rather than a raw numeric."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Per-row URL pointing to a 200px product front image hosted on images.openfoodfacts.org, with French/English locale suffixes embedded in the filename. All 50 rows are unique with zero nulls, so this acts as a row-level asset reference rather than a feature. The path segments encode the product barcode (e.g. 6111242100992), making this effectively a derivable identifier.","role":"identifier","scope":"column","target":"image_small_url","treatment":"Drop from modelling; retain as a fetch URL for image pipelines or extract the embedded barcode."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'packaging_recycling_tags' was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds packaging or recyclability tags, likely a multi-valued or list-like field that the profiler could not categorise. 
Without parsed values, nothing can be said about cardinality, distribution, or label vocabulary.","role":"other","scope":"column","target":"packaging_recycling_tags","treatment":"Re-profile after parsing into a list or one-hot tag set before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a categorical food taxonomy field using Open Food Facts-style prefixed slugs (e.g., 'en:biscuits-and-cakes'). The distribution is heavily concentrated on sweets: 'en:biscuits-and-cakes' (17/49) and 'en:chocolate-products' (16/49) together account for roughly two-thirds of non-null rows, with 11 distinct categories across 50 records and a 2% null rate. Entropy ratio of 0.74 confirms moderate concentration rather than uniform spread.","role":"feature","scope":"column","target":"food_groups","treatment":"Strip the 'en:' prefix and one-hot or target-encode; consider grouping the long tail of single-occurrence categories into 'other'."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'nova_groups_markers' was skipped by the profiler, so no type, uniqueness, or distribution stats are available beyond a row count of 50 and a null rate of 0.0. The name suggests it carries NOVA food-classification group markers, likely a list or structured field that the dissector could not parse. 
Without parsed values, nothing further can be said about its content.","role":"other","scope":"column","target":"nova_groups_markers","treatment":"Inspect raw values manually and reparse (likely a list/struct) before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.top_rate","stats.top_value","stats.cardinality","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"German-language packaging description field, almost entirely unpopulated. With a 60% null rate and the empty string accounting for 19 of the 20 non-null rows (95% top_rate), only one row carries actual content (\"1 Folie aus 22 PAP zum Recyclen\"). Cardinality of 2 and entropy ratio of 0.29 confirm there is virtually no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_de","treatment":"Drop; effectively empty with only one informative value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold lowercase ISO language codes, with 6 distinct values across 50 rows and no nulls. The distribution is dominated by 'fr' (25) and 'en' (19), together covering 44 of 50 rows, while 'es', 'de', 'it', and 'pl' form a thin long tail. Entropy ratio of 0.63 reflects this Franco-English skew rather than a balanced multilingual mix.","role":"feature","scope":"column","target":"categories_lc","treatment":"One-hot encode, optionally collapsing rare codes (it, pl, de, es) into an 'other' bucket."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'checkers' was skipped by the profiler, so its data type and value distribution are unknown. 
Only the row count (50) and null rate (0.0) are reported; n_unique and all other statistics are missing. Without further inspection there is no basis to infer what this column represents.","role":"other","scope":"column","target":"checkers","treatment":"Re-profile or manually inspect the column before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Spanish-language packaging description, populated for almost none of the rows. 60% are null and of the 20 non-null entries, 19 are empty strings, leaving exactly one real value describing a recyclable cardboard box and plastic tray. Effective cardinality is 2 and entropy ratio is 0.29, so this column carries virtually no signal in this sample.","role":"free_text","scope":"column","target":"packaging_text_es","treatment":"Drop unless a larger sample shows meaningful Spanish text coverage."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labelled `unknown_nutrients_tags` and was skipped by the profiler, so no descriptive statistics, uniqueness count, or value samples are available. The only confirmed signals are that all 50 rows are non-null and the column kind is reported as 'unknown'. Without further evidence its content and structure cannot be characterised.","role":"other","scope":"column","target":"unknown_nutrients_tags","treatment":"Re-profile with type inference enabled before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `editors_tags` was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 50 and a null rate of 0.0. 
Without sample values or a detected kind, the content and structure are unknown \u2014 the name suggests editor-assigned tags, possibly a list or delimited string, but this is not confirmed by evidence.","role":"other","scope":"column","target":"editors_tags","treatment":"Re-profile with list/string parsing enabled to determine structure before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.std","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This is a nutrition-score warning flag indicating whether fruit/vegetable/nut content was estimated from ingredients. Every one of the 45 non-null rows holds the value 1.0, and 10% of rows are null \u2014 so the column carries no discriminative signal in this sample, only a presence/absence distinction.","role":"metadata","scope":"column","target":"nutrition_score_warning_fruits_vegetables_nuts_estimate_from_ingredients","treatment":"Drop as a feature; optionally retain a binary is_null indicator if the missingness itself is meaningful."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a lowercase ISO language code label, with 6 distinct values across 50 rows and one null. English and French dominate at 22 occurrences each, leaving es, de, it, and pl with just 1-2 rows combined \u2014 a near-binary distribution despite the multilingual appearance. 
Entropy ratio of 0.61 confirms the imbalance.","role":"label","scope":"column","target":"labels_lc","treatment":"Group rare codes (es/de/it/pl) into 'other' before stratifying or one-hot encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'nutriscore_data' was skipped by the profiler, so its kind, uniqueness, and value distribution are unknown. The only confirmed signals are 50 rows with a 0.0 null rate. Without further stats, the contents (likely a nested Nutri-Score payload given the name) cannot be characterised.","role":"other","scope":"column","target":"nutriscore_data","treatment":"Re-profile with nested/struct support enabled before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is flagged as skipped by the profiler, so no statistics beyond row count (50) and a null rate of 0.0 were computed. The name suggests it holds tag-style annotations for additional nutritional substances, likely a delimited or list-valued field that the dissector could not type. Without unique counts or value samples, its actual content and cardinality remain unverified.","role":"other","scope":"column","target":"other_nutritional_substances_tags","treatment":"Manually inspect raw values and re-profile as a multi-label tag list before deciding to encode or drop."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"Norwegian product name field (suffix _nb suggests Bokm\u00e5l locale) that is almost entirely empty: 96% null across 50 rows, leaving only 2 non-null observations with one being an empty string and the other '99% m\u00f8rk sjokolade'. 
With just two distinct values and effectively no signal, this column cannot support analysis as-is.","role":"metadata","scope":"column","target":"product_name_nb","treatment":"Drop unless joined to a richer localized catalog; null rate is too high to model."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the basis on which nutrition data is reported, and every one of the 50 rows carries the single value \"100g\". With cardinality of 1, entropy of 0, and a top_rate of 1.0, the field provides no discriminating information whatsoever.","role":"metadata","scope":"column","target":"nutrition_data_prepared_per","treatment":"Drop; constant column carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric product quantities stored as strings, treated here as categorical with 27 distinct values across 50 rows. The mode '100' covers 23.4% of non-nulls, but entropy ratio of 0.90 confirms a long tail with most other values appearing only once or twice. Note 6% nulls and the presence of '0' as a quantity, which may indicate missing or placeholder stock entries.","role":"feature","scope":"column","target":"product_quantity","treatment":"Cast to numeric and treat as a quantitative feature; investigate zeros and nulls before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a categorical column recording product type, but every one of the 50 rows holds the same value, \"food\". 
Cardinality is 1 and entropy is 0, so the column carries no information for modelling or segmentation.","role":"metadata","scope":"column","target":"product_type","treatment":"Drop; constant column with zero entropy."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `checkers_tags` was skipped by the profiler, so its kind is unknown and no statistics (uniqueness, value distribution, type) were computed. Only the row count (50) and null rate (0.0) are available; everything else is missing. The name suggests it may hold tag-like values associated with a checkers process, but this cannot be confirmed from the evidence.","role":"other","scope":"column","target":"checkers_tags","treatment":"Re-run profiling or manually inspect a sample before deciding how to use this column."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'nucleotides_tags' was skipped by the profiler, so no type, uniqueness, or distribution statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds tag-style annotations related to nucleotides, likely a list or delimited string, but this cannot be confirmed from the evidence. No further signal is present to characterise its values.","role":"other","scope":"column","target":"nucleotides_tags","treatment":"Re-profile with list/string parsing enabled before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named languages_tags, suggesting it holds language metadata (likely tag strings such as locale codes) for each record. Saturn skipped detailed profiling, so no cardinality, distribution, or value samples are available beyond a row count of 50 and a null rate of 0.0. 
Without uniqueness or value stats, no surprises can be flagged.","role":"metadata","scope":"column","target":"languages_tags","treatment":"Re-profile or inspect raw values to determine structure before deciding whether to split tags and one-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a low-cardinality categorical column holding lowercase language codes (fr, en, es, de, it, pl), almost certainly a detected or declared language tag. The distribution is heavily concentrated on French (23/50) and English (20/50), with the top value covering 47.9% of non-null rows and entropy ratio of 0.61. Four percent of rows are null and three languages appear only once, so any per-language analysis will be unstable beyond fr/en.","role":"feature","scope":"column","target":"traces_lc","treatment":"Keep fr/en as-is and bucket de/es/it/pl into an 'other' category before encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `categories_hierarchy` was skipped by the profiler, so no type, uniqueness, or distribution stats are available. The name suggests a nested or path-like categorical structure (e.g., taxonomy levels), but this cannot be confirmed from the evidence. Only the row count (50) and null rate (0.0) are known.","role":"other","scope":"column","target":"categories_hierarchy","treatment":"Re-profile after parsing the hierarchy (e.g., split into level columns) before deciding on encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"URLs pointing to small front-of-pack product images on the Open Food Facts CDN, one per row. 
Every one of 50 values is unique (entropy_ratio 1.0, top_rate 0.02) and there are no nulls, so this acts as a per-product asset link rather than a feature. URLs mix `front_fr` and `front_en` suffixes, hinting at a French/English language mix in the source catalogue.","role":"metadata","scope":"column","target":"image_front_small_url","treatment":"Keep as a reference link; drop from modelling or fetch the images separately for vision features."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","column"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics beyond row count and null rate are available. The name 'entry_dates_tags' suggests a composite field combining dates and tags, likely a nested or list-like structure that didn't fit a scalar type. With 50 rows and 0% nulls, every record has some value, but its shape is unknown from this evidence.","role":"other","scope":"column","target":"entry_dates_tags","treatment":"Inspect raw values and parse into separate date and tag columns before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'ecoscore_tags' was skipped by the profiler, so no statistics, uniqueness, or value samples are available beyond a row count of 50 and a null rate of 0.0. Based on the name alone, it likely holds Open Food Facts-style ecoscore category tags (e.g., 'en:b'), but this cannot be confirmed from the evidence. 
The 'skipped' alert is the key signal here and warrants a re-profile with appropriate parsing.","role":"other","scope":"column","target":"ecoscore_tags","treatment":"Re-profile with list/tag-aware parsing before deciding on encoding or drop."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","min","max","mean","std"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a binary warning flag indicating that the fruits/vegetables/legumes share in a Nutri-Score calculation was estimated from ingredients. Every non-null value is 1.0 (n_unique=1, std=0), and 8% of rows are null, so the column carries no discriminative signal in this sample.","role":"metadata","scope":"column","target":"nutrition_score_warning_fruits_vegetables_legumes_estimate_from_ingredients","treatment":"Drop; constant value provides no information."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.mean","stats.median","stats.min","stats.max","stats.std","stats.skew","stats.kurtosis","stats.q1","stats.q3","stats.iqr","stats.zero_rate","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Counts the number of ingredients in a record that lack a CIQUAL code, so it's a data-quality feature describing how complete the ingredient mapping is. The distribution is right-skewed (skew 1.21) with a median of 3.5 but a max of 22 and one outlier; 18% of rows are already fully mapped (zero_rate 0.18). 
Only 15 unique values across 50 rows, so it behaves like a small ordinal count.","role":"feature","scope":"column","target":"ingredients_without_ciqual_codes_n","treatment":"Treat as a count; consider log1p or a binary 'fully mapped' flag before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.std","stats.skew","stats.iqr","stats.n_outliers","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"A numeric revenue feature spanning 19 to 674 with a mean of 230 and median of 233.5, suggesting per-record monetary or count values. Distribution is moderately right-skewed (0.71) with a wide IQR of 237.75 and only one outlier (2%), so spread is large but not pathological. All 50 rows are populated with no zeros and 46 unique values.","role":"feature","scope":"column","target":"rev","treatment":"Consider a log or sqrt transform before regression to tame the right skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.std","stats.zero_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a count of non-nutritive (artificial) sweeteners listed in a product's ingredients. Across all 50 rows it is exactly 0, with zero_rate of 1.0 and no nulls, so it carries no information in this sample.","role":"feature","scope":"column","target":"ingredients_non_nutritive_sweeteners_n","treatment":"Drop; constant zero provides no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.q1","stats.q3","stats.zero_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"This is a count of ingredients on a product that lack Ecobalyse identifiers, ranging from 0 to 29 with a median of 6.5 and mean 8.16. 
The distribution is right-skewed (skew 1.28) with one outlier at the high end, suggesting most products have a handful of unmapped ingredients while a few have many. Only 2% are zero, meaning nearly every row has at least one ingredient missing an Ecobalyse ID \u2014 a notable data-coverage gap.","role":"feature","scope":"column","target":"ingredients_without_ecobalyse_ids_n","treatment":"Use as-is or log-transform if feeding into a regression; treat as a coverage-quality signal."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no type, uniqueness, or distribution stats are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds tags describing environmental impact levels, likely a list-valued or multi-label field that the profiler could not classify. Without parsed values there is no way to confirm cardinality, label vocabulary, or whether tags are single- or multi-valued.","role":"other","scope":"column","target":"environment_impact_level_tags","treatment":"Re-profile after parsing the tag structure (e.g., split lists) before deciding on encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named `last_image_dates_tags`, suggesting it holds image-related dates and tags, but saturn skipped profiling so type and content cannot be confirmed. 
The only evidence available is 50 rows with no nulls; uniqueness, distribution, and value samples are all missing.","role":"other","scope":"column","target":"last_image_dates_tags","treatment":"Inspect raw values manually to determine structure before deciding on parsing or modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so its contents are uncharacterised beyond a row count of 50 and a null rate of 0.0. The name suggests a nested or structured label taxonomy, which likely tripped the profiler's type detection. No uniqueness, value, or distribution statistics are available to confirm.","role":"other","scope":"column","target":"labels_hierarchy","treatment":"Inspect raw values manually and parse the hierarchy (e.g., split on delimiter or expand JSON) before profiling again."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text English product names with 34 unique values across 50 rows and high entropy ratio (0.91), indicating heavy diversity. Notable issues: 14% nulls plus an empty-string value taking the top slot at 23.3% (10 occurrences), so effective missingness is much higher than null_rate alone suggests. 
Values mix languages (e.g., 'Edelbitter-Schokolade', 'Chocolat noir', 'tonik') and include junk like 'Hhhhh', flagged as long_tail.","role":"free_text","scope":"column","target":"product_name_en","treatment":"Normalise empties to null, language-detect, then tokenize/embed before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["zero_rate","median","iqr","max","mean","std","skew","kurtosis","n_outliers","outlier_rate","null_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Nutri-Score warning value estimating fruit/vegetable/legume content from ingredients. The distribution is dominated by zeros (zero_rate 0.89, median and IQR both 0), with a handful of extreme values pushing the max to 50 and producing severe skew (5.93) and kurtosis (35.2). Five outliers (10.9% rate) drive the mean to 1.65 despite a std of 7.55, and 8% of rows are null.","role":"feature","scope":"column","target":"nutrition_score_warning_fruits_vegetables_legumes_estimate_from_ingredients_value","treatment":"Binarize (zero vs non-zero) or winsorize before modelling given the heavy zero mass and extreme skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds comma-separated allergen/ingredient trace tags with an `en:` language prefix (e.g. `en:milk,en:nuts`), so each cell is a multi-label set rather than a single category. Across 50 rows there are 23 distinct combinations and entropy ratio 0.87, indicating high diversity, and the most common value is the empty string at 22% (11 rows) \u2014 meaning missing-as-empty rather than a true null (null_rate 0.0). 
The long_tail alert reflects many combinations appearing only once or twice.","role":"feature","scope":"column","target":"traces","treatment":"Split on commas and multi-hot encode the individual `en:` tags; treat empty string as missing."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Finnish-language generic product name field, populated for only 5 of 50 rows (90% null). Among the 5 present values, all are unique with maximum entropy (2.32, ratio 1.0), and casing inconsistencies appear (\"Tumma suklaa\" vs \"tumma suklaa\") plus one empty string counted as a value.","role":"free_text","scope":"column","target":"generic_name_fi","treatment":"Normalise case and treat empty strings as null; too sparse (90% missing) to use as a feature without imputation or dropping."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be original packaging or establishment codes (EMB-prefixed identifiers used on European food labels), kept in raw form. The column is sparsely populated: 34% are null and among the remaining rows the empty string dominates at roughly 85% (top_rate 0.848), leaving only 5 distinct values across 50 rows. One entry is not a code at all but a company name pair (SOLENT GMBH & CO. 
KG,SCHWARZ BETEILIGUNGS GMBH), suggesting inconsistent source formatting.","role":"metadata","scope":"column","target":"emb_codes_orig","treatment":"Normalise empty strings to null and parse/validate the EMB code pattern before use; too sparse to model directly."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","zero_rate","mean","median","max","skew","kurtosis","std","q3","n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Counts the number of ingredients whose percentage is explicitly specified on a product label. The distribution is heavily zero-inflated (zero_rate 0.58) with median 0 and mean 1.1, but a long right tail reaches 8 (skew 1.88, kurtosis 3.68), and only 7 distinct values appear across 50 rows.","role":"feature","scope":"column","target":"ingredients_with_specified_percent_n","treatment":"Treat as a count feature; consider a binary 'has_specified_percent' flag plus log1p transform to tame the skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a Nutri-Score-style nutrition grade for each item, with six observed levels (a-e plus 'unknown'). The distribution is heavily skewed toward the worst grade: 'e' accounts for 27 of 50 rows (top_rate 0.54), while 'a' and 'b' together appear only 6 times. 
One row carries the literal value 'unknown' rather than null, so null_rate is 0.0 despite missing information.","role":"label","scope":"column","target":"nutrition_grades","treatment":"Treat as ordered categorical (a<b<c<d<e), recode 'unknown' as missing, and watch for class imbalance toward 'e'."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `weighers_tags` was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 50 and a null rate of 0.0. Without `n_unique` or any sample values it is impossible to tell whether this holds tag strings, arrays, or something else. The name suggests a multi-valued tag field associated with 'weighers', which would explain why the profiler couldn't fit it into a standard kind.","role":"other","scope":"column","target":"weighers_tags","treatment":"Re-profile with array/text handling enabled to determine structure before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `categories_tags` was skipped by the profiler, so no type, cardinality, or distribution stats are available beyond the row count (n=50) and a null rate of 0.0. The name suggests a multi-valued tag field (e.g., comma- or colon-separated category labels), but this cannot be confirmed from the evidence. No further signal is present.","role":"other","scope":"column","target":"categories_tags","treatment":"Re-profile with parsing for delimited tag lists before deciding on encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Open Food Facts product image URLs, one per row, all pointing to front-of-package JPEGs at 400px width. 
Every one of the 50 values is unique (entropy_ratio 1.0, top_rate 0.02), so it functions as a per-row asset link rather than a categorical feature. URL paths mix _fr and _en locale suffixes, hinting at a multilingual product catalog.","role":"identifier","scope":"column","target":"image_url","treatment":"Drop from modelling; retain as a reference link or fetch for downstream image features."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column \"sources\" was skipped by the profiler, so its kind is unknown and no statistics (uniqueness, value distribution, type) were computed. Only two facts are available: 50 rows were seen and none were null. Without further inspection, nothing can be said about its content or structure.","role":"other","scope":"column","target":"sources","treatment":"Re-profile or manually inspect this column before any downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'languages_hierarchy' was skipped by the profiler, so no statistics are available beyond a row count of 50 and a null rate of 0. The name suggests a nested or structured representation of languages (likely a list or path-like string), but the dissector did not characterize its values. No uniqueness, length, or value-distribution signals are present to confirm.","role":"other","scope":"column","target":"languages_hierarchy","treatment":"Re-profile with a parser that handles nested/structured values before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a PNNS food group classifier with 7 distinct categories and no nulls across 50 rows. 
The distribution is severely imbalanced: 'Sugary snacks' accounts for 76% of records, with entropy ratio just 0.48, suggesting the sample is dominated by one food type. Two rows are explicitly labeled 'unknown', and four other categories appear only once or twice each.","role":"feature","scope":"column","target":"pnns_groups_1","treatment":"One-hot encode, but expect the 'Sugary snacks' class to dominate any downstream model."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Lowercase ISO-style language or country codes with 6 distinct values across 50 rows and a 2% null rate. The distribution is heavily English-dominant (en at 28, top_rate 0.57) followed by fr at 16, leaving es/de/it/pl as singletons or near-singletons. Entropy ratio of 0.59 confirms the long tail is thin and unlikely to support per-class modelling.","role":"feature","scope":"column","target":"countries_lc","treatment":"Group rare codes into an 'other' bucket and one-hot encode; impute the 2% nulls."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `additives_tags` was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests a list-style field enumerating food additive identifiers (e.g., E-numbers), but this cannot be confirmed from the evidence. 
No distributional signal is present to flag.","role":"other","scope":"column","target":"additives_tags","treatment":"Re-profile with list/string parsing enabled, then explode tags for one-hot or multi-label encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"Column `codes_tags` was skipped by the profiler, so no type inference, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests a tag or code list (likely a delimited or array-valued field), but this cannot be confirmed from the evidence. Without `n_unique` or any sampled values, no distributional claims can be made.","role":"other","scope":"column","target":"codes_tags","treatment":"Re-profile with array/string parsing enabled before deciding on a downstream transform."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column `countries_tags` was skipped by the profiler (kind=unknown) so no statistics were computed beyond a 50-row count with 0% nulls. Based solely on the name, it likely holds country tag strings (e.g., comma- or colon-delimited slugs), but uniqueness, cardinality, and value distribution are all unknown here. Treat any interpretation as provisional until the column is reparsed.","role":"feature","scope":"column","target":"countries_tags","treatment":"Reparse as a delimited tag list, then explode and one-hot or multi-label encode before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Usernames of the people or bots that created each record, with 13 distinct creators across 50 rows and no nulls. 
Two accounts dominate: 'openfoodfacts-contributors' at 46% (23 rows) and 'kiliweb' at 15 rows, together covering 76% of the column, while the remaining creators each appear once or twice \u2014 a classic long tail flagged in alerts.","role":"metadata","scope":"column","target":"creator","treatment":"Collapse rare creators into an 'other' bucket before any encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named 'ingredients' but saturn skipped profiling it (kind=unknown, no stats computed). Across 50 rows there are zero nulls, but uniqueness, types, and value distribution are all unknown. Based on the name alone it is likely a list or free-text field of recipe components, which is why a generic profiler bailed out.","role":"free_text","scope":"column","target":"ingredients","treatment":"Parse into a list and one-hot or tokenize/embed before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_rate","top_value","top_values","n"],"model":"anthropic:claude-opus-4-7","narrative":"Dutch-language product names, but the column is mostly empty: 76% of rows are null and of the 12 populated rows, 6 are blank strings, leaving only 6 actual names across 7 unique values. 
The surviving entries are a language mix (English 'Dark absolute', French 'Tartines craquantes multi-c\u00e9r\u00e9ales', Dutch 'Volkoren cracotte'), so the field is not consistently Dutch despite its name.","role":"free_text","scope":"column","target":"product_name_nl","treatment":"Drop or defer; too sparse and linguistically inconsistent to use without upstream cleanup."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'ingredients_n_tags' was skipped by the profiler, so no statistics, uniqueness, or type information are available beyond a row count of 50 and a null rate of 0.0. The name suggests a count of ingredient tags, but this cannot be confirmed from the evidence. Without stats, any downstream assumption about its distribution or role is unsupported.","role":"other","scope":"column","target":"ingredients_n_tags","treatment":"Re-profile with type coercion to determine whether this is numeric before use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Spanish-language origin field, but it carries no usable signal in this sample. 60% of rows are null and the remaining 20 non-null entries are all the empty string, giving cardinality 1 and entropy 0.","role":"metadata","scope":"column","target":"origin_es","treatment":"Drop; the column has no variation and a 60% null rate."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.top_rate","stats.top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Polish-language product names, populated for only 10% of rows (null_rate 0.9) with just 3 distinct values across 50 records. 
The top value is the empty string at 60%, leaving only two real product names ('Czekolada gorzka 74%' and 'Excellence 70% Cocoa Intense Dark') appearing once each. Both the long_tail and null_rate alerts fire, and empty strings are being counted as a category rather than nulls.","role":"metadata","scope":"column","target":"product_name_pl","treatment":"Normalise empty strings to null and treat as a sparse localisation field; drop unless Polish-market analysis is required."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'scores' was skipped by the profiler and reports kind 'unknown', so no statistics, uniqueness, or value distribution were computed. The only confirmed signals are 50 rows and a 0.0 null rate; everything else is missing. Without type inference or sample values, the column's actual content (numeric scores, lists, structured objects) cannot be determined from this evidence.","role":"other","scope":"column","target":"scores","treatment":"Re-profile with type coercion or inspect raw values before deciding on a downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Brand name of each product, with 41 distinct values across 50 rows and no nulls. The distribution is essentially flat (entropy ratio 0.97), with Lindt leading at just 8% (4 occurrences) and most brands appearing once \u2014 a long tail flagged explicitly. 
One value is in Arabic script (\u0639\u0631\u0628\u064a), suggesting mixed-language entries that may need normalization.","role":"feature","scope":"column","target":"brands","treatment":"Group rare brands into an 'other' bucket and normalize encodings/scripts before one-hot or target encoding."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"German-language ingredient declarations, likely scraped from product packaging (e.g. Kakaomasse, Zucker, Weizenmehl). Coverage is poor: 60% null and the most common value is the empty string (5/50, 25% of non-nulls), while the remaining 16 unique strings are essentially free text with allergen markup like _SOJA_ and _WEIZENMEHL_. Entropy ratio of 0.94 confirms each populated row is nearly unique, so this behaves as free text rather than a category.","role":"free_text","scope":"column","target":"ingredients_text_de","treatment":"Treat as free text: parse comma-separated tokens or embed; do not one-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Norwegian Bokm\u00e5l ingredients text field, likely from a multilingual product dataset. 
It is effectively empty: 96% of the 50 rows are null, and the only non-null value across the remaining 2 rows is an empty string, leaving cardinality at 1 and entropy at 0.","role":"free_text","scope":"column","target":"ingredients_text_nb","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.iqr","stats.skew","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a count of packaging components per product, ranging from 1 to 5 with a mean of 2.07 and median of 2. The IQR is 0 because Q1 and Q3 both equal 2, which mechanically labels nearly half the rows (outlier_rate 0.488, n_outliers 20) as outliers \u2014 a quirk of the IQR rule on a low-cardinality integer, not a data quality issue. Note the 18% null rate and only 5 distinct values across 50 rows.","role":"feature","scope":"column","target":"packagings_n","treatment":"Treat as a small-count integer feature; impute the 18% nulls and ignore the IQR-flagged outliers."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","mean","zero_rate","null_rate","n"],"model":"anthropic:claude-opus-4-7","narrative":"Binary 0/1 indicator (n_unique=2, min=0, max=1) likely flagging completion status. Only 32% of rows are marked complete (mean=0.32, zero_rate=0.68), so the negative class dominates roughly 2:1. 
No nulls or outliers across the 50 rows.","role":"label","scope":"column","target":"complete","treatment":"Treat as binary target; account for the 68/32 class imbalance during modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a packager/manufacturer code field from an Open Food Facts-style export, dated 2014-10-16, mixing French EMB establishment codes (e.g., 'EMB 44068A') with free-text manufacturer descriptors in multiple languages (German, Spanish). With only 50 rows, 58% are null and another 30% (15/50) are empty strings as the top value, leaving just 6 distinct non-empty entries \u2014 each appearing exactly once. Entropy ratio of 0.57 and the dominance of blanks make this column nearly unusable as-is.","role":"metadata","scope":"column","target":"emb_codes_20141016","treatment":"Drop or defer; coverage is too sparse and values too heterogeneous to feature-engineer without a dedicated parser."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'ingredients_tags' was skipped by the profiler, so no type, uniqueness, or distributional statistics are available. The only confirmed signals are 50 rows with a 0.0 null rate. 
The name suggests a list-valued or delimited tag field (e.g., ingredient identifiers), which would explain why standard profiling bailed out.","role":"free_text","scope":"column","target":"ingredients_tags","treatment":"Parse/explode the tag list and one-hot or embed the individual ingredients before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Japanese-language packaging text, almost entirely absent: 98% of the 50 rows are null and the single non-null value is itself an empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here for any downstream task.","role":"free_text","scope":"column","target":"packaging_text_ja","treatment":"Drop the column; it is effectively empty."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"German-language generic product name, likely a free-text label for food items (chocolates, biscuits, spreads). Coverage is poor: null_rate is 0.6 and the top value is the empty string at 12 occurrences, while the remaining 9 unique values each appear once, indicating no repetition across products. Entropy_ratio of 0.68 reflects the empty-string mass dominating an otherwise unique long tail.","role":"free_text","scope":"column","target":"generic_name_de","treatment":"Treat as free text; impute missing and normalize/tokenize before any categorical use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Likely the username or bot handle that last edited each record. 
One contributor, \"foodless\", dominates with 21 of 50 rows (top_rate 0.43), while the remaining 49 rows spread across 23 other editors, producing a long tail and entropy ratio of 0.77. Roughly 2% of values are null, and several handles look like apps/bots (e.g., municorn-calorie-counter-app, macrofactor) mixed with human usernames.","role":"metadata","scope":"column","target":"last_editor","treatment":"Group rare editors into an \"other\" bucket and keep as a categorical provenance feature."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `minerals_prev_tags` was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 50 and a null rate of 0.0. Without `n_unique` or any descriptive stats, the content and structure of this field are unknown. The name suggests it may hold prior tag annotations related to minerals, but this cannot be confirmed from the evidence.","role":"other","scope":"column","target":"minerals_prev_tags","treatment":"Re-profile with the appropriate parser (likely list/string) before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","median","mean","skew","kurtosis","n_unique","n","null_rate","zero_rate","n_outliers","outlier_rate","q1","q3"],"model":"anthropic:claude-opus-4-7","narrative":"Values are 10-digit integers ranging from 1,639,159,016 to 1,767,675,445 with a median of 1,752,195,111 \u2014 these are Unix epoch seconds, so the column is a 'last image' timestamp spanning roughly late 2021 through 2025. 
All 50 rows are unique with no nulls or zeros, but the distribution is strongly left-skewed (skew -2.44, kurtosis 7.36) with 2 outliers (4%) sitting far below the bulk, indicating a few very stale records against an otherwise recent cluster.","role":"timestamp","scope":"column","target":"last_image_t","treatment":"Cast from epoch seconds to datetime and derive recency features rather than using the raw integer."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a date column marking when items became obsolete, but it carries no usable information in this sample. Across 50 rows there is a single non-null distinct value \u2014 the empty string \u2014 making up 100% of non-nulls (44 of 44), with a 12% null rate on top. Entropy is 0.0 and cardinality is 1, so the field is effectively blank.","role":"metadata","scope":"column","target":"obsolete_since_date","treatment":"Drop; the column is constant (empty) and offers no signal."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column `pnns_groups_2_tags` was skipped by the profiler, so no statistics, uniqueness count, or value samples are available. The only confirmed signals are 50 rows present and a 0.0 null rate. 
The name suggests Open Food Facts PNNS group-2 category tags, typically a low-cardinality categorical, but this cannot be verified from the evidence.","role":"other","scope":"column","target":"pnns_groups_2_tags","treatment":"Re-run the profiler on this column to determine type before deciding; if categorical tags, one-hot or target-encode."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'emb_codes_tags' was skipped by saturn, so no statistics beyond row count (50) and a null rate of 0.0 are available. The name suggests it holds embossing or packaging code tags, likely a multi-valued categorical string field, but uniqueness, cardinality, and value distribution are unknown. Without further profiling no surprises can be flagged.","role":"other","scope":"column","target":"emb_codes_tags","treatment":"Re-profile with string/list parsing enabled before deciding whether to one-hot encode or drop."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a multi-country list field (likely product distribution countries from an Open Food Facts\u2013style source, captured before a scan-bot pass). With 38 unique values across 50 rows and entropy_ratio 0.965, it is nearly free-form: France leads at only 6 occurrences (top_rate 0.14), and many cells are comma-separated lists. 
Values mix languages (French 'Belgique', Spanish 'B\u00e9lgica', Dutch 'nl:Duitsland', English 'en:Morocco') and taxonomy-prefixed codes, plus a 14% null rate.","role":"feature","scope":"column","target":"countries_beforescanbot","treatment":"Split on comma, normalize language variants and 'xx:' prefixes to ISO country codes, then multi-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is the French Nutri-Score grade (a-e) for each food item, with one row coded as 'unknown'. The distribution is heavily skewed toward the worst grade: 'e' alone covers 54% of the 50 rows, and grades d+e together dominate while only 6 rows are 'a' or 'b'. Entropy ratio of 0.74 confirms moderate concentration rather than a balanced ordinal spread.","role":"label","scope":"column","target":"nutrition_grade_fr","treatment":"Treat as ordered categorical (a<b<c<d<e); map 'unknown' to NaN and watch for class imbalance toward 'e'."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'data_quality_tags' was skipped by the profiler, so no kind, uniqueness, or value statistics are available. The only confirmed signals are 50 rows with a null_rate of 0.0, meaning every row has some value, but its content and cardinality are unknown.","role":"other","scope":"column","target":"data_quality_tags","treatment":"Re-profile or manually inspect before use; the profiler skipped this column."},{"confidence":"high","critiques":[],"evidence_keys":["zero_rate","median","mean","std","max","skew","q1","q3","n_unique","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a numeric feature summing the percentages of ingredients whose proportions are explicitly disclosed (likely on food product labels). 
The distribution is heavily zero-inflated with a zero_rate of 0.58 and median of 0.0, while non-zero values stretch up to 99.6 with mean 22.74 and std 32.88. The right skew (0.998) and bimodal shape (q1=0, q3=52.25) suggest two regimes: products with no specified percentages and those with substantial disclosure.","role":"feature","scope":"column","target":"ingredients_with_specified_percent_sum","treatment":"Consider a hurdle approach: a binary 'has_disclosure' flag plus the continuous value, since 58% of rows are zero."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be an origin flag for Italy, but it carries no information: of 50 rows, 68% are null and the remaining 16 non-null values are all empty strings, giving a single unique value and zero entropy. There is no signal here to model on.","role":"feature","scope":"column","target":"origin_it","treatment":"Drop; constant column with majority nulls."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the basis on which nutrition values are reported, taking only two values: '100g' and 'serving'. The encoding is heavily skewed, with 84% of the 50 rows using '100g' and the remaining 8 rows using 'serving', and there are no nulls. 
Analysts should note that nutrition figures in other columns are not directly comparable across rows without normalising to a common basis.","role":"metadata","scope":"column","target":"nutrition_data_per","treatment":"Use as a grouping flag and normalise nutrition fields to a single basis before aggregation."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an origin-related categorical field (likely a place/location code from the column name 'origin_pl'), but it carries almost no information here. 90% of the 50 rows are null, and the remaining 5 non-null entries are all empty strings, giving cardinality 1 and entropy 0.","role":"metadata","scope":"column","target":"origin_pl","treatment":"Drop; the column is 90% null with only empty strings remaining."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'product' was skipped by the profiler, so no type, cardinality, or value statistics are available beyond a row count of 50 and a null rate of 0.0. Without unique counts or sample values, the role of this column cannot be inferred from the evidence.","role":"other","scope":"column","target":"product","treatment":"Re-run the profiler on this column to obtain stats before deciding on treatment."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.cardinality","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"URLs pointing to product pages, likely a manufacturer/source link field. The dominant value is the empty string at 21 of 50 rows (top_rate 0.4375), and combined with a 4% null rate this column is mostly missing. 
The remaining 28 unique values look like one-off product URLs across various brand domains, hence the long_tail alert and entropy ratio of 0.76.","role":"metadata","scope":"column","target":"link","treatment":"Extract domain as a low-cardinality feature; drop the raw URL as it's near-unique and mostly blank."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Dutch-language ingredient lists for food products, present for only 24% of the 50 rows (null_rate 0.76). Among the 12 non-null entries there are 9 distinct strings with high entropy_ratio 0.92, and the modal value is actually the empty string (4 occurrences) rather than a real ingredient list. Contents range from short declarations like 'Aardappelen, zonnebloemolie, zeezout.' to long packaging blurbs containing addresses and URLs, so the field mixes ingredients with marketing text.","role":"free_text","scope":"column","target":"ingredients_text_nl","treatment":"Treat empty strings as nulls, then tokenize and embed (or parse comma-separated ingredients) before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.kurtosis","stats.zero_rate","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Count of additives per product, ranging from 0 to 8 across 50 rows with no nulls and only 8 distinct values. The distribution is heavily right-skewed (skew 1.47, kurtosis 2.10) with a zero_rate of 0.4 and median of 1, while a small tail produces 2 outliers (outlier_rate 0.04). 
Mean (1.52) sits well above the median, confirming a few additive-heavy products pull the average up.","role":"feature","scope":"column","target":"additives_n","treatment":"Treat as a discrete count; consider log1p or binning (0 vs 1+ vs many) before modelling given the skew and high zero_rate."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Swedish-language generic product name, populated for only 4 of 50 rows (null_rate 0.92). The four observed values are all distinct (entropy_ratio 1.0), including one empty string, so there is effectively no usable signal here. Top value 'Fin m\u00f6rk choklad med 90% kakao' appears just once.","role":"free_text","scope":"column","target":"generic_name_sv","treatment":"Drop or defer \u2014 too sparse (92% null) and unique to model."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics, uniqueness, or value samples are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds tags listing ingredients potentially derived from palm oil, likely a multi-valued/list field typical of Open Food Facts exports. 
Without parsed values, nothing can be said about cardinality, distribution, or content.","role":"feature","scope":"column","target":"ingredients_that_may_be_from_palm_oil_tags","treatment":"Re-profile after parsing as a list of tags, then one-hot or count-encode before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.std","stats.skew","stats.iqr","stats.zero_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"A non-negative integer count of recognised ingredients per record, ranging from 0 to 36 with a mean of 11.76 and median of 9. The distribution is right-skewed (skew 0.86) with a wide IQR of 13.5, and 4% of rows are zero \u2014 meaning a small fraction had no ingredients matched at all. No outliers were flagged and there are no nulls across the 50 rows.","role":"feature","scope":"column","target":"known_ingredients_n","treatment":"Consider a log1p transform before modelling to tame the right skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.std","stats.skew","stats.outlier_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"A numeric quality score named 'completeness', bounded loosely between 0.575 and 1.1 with mean 0.91 and median 0.9, so most rows are near-complete. The max of 1.1 is suspicious for a metric that nominally caps at 1.0, and 12% of values flag as outliers with a left skew of -0.67, suggesting a tail of poorly-populated records. 
Only 14 unique values across 50 rows hints at a discretised or rounded score rather than a continuous measurement.","role":"feature","scope":"column","target":"completeness","treatment":"Clip values above 1.0 and inspect the low-end outliers before using as a quality filter."},{"confidence":"high","critiques":[],"evidence_keys":["alerts","n","n_unique","stats.zero_rate","stats.std","stats.min","stats.max"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to count sweetener ingredients per record, but every one of the 50 rows holds the value 0 (zero_rate 1.0, n_unique 1, std 0.0). It carries no information for modelling and is flagged constant.","role":"feature","scope":"column","target":"ingredients_sweeteners_n","treatment":"Drop; constant column with zero variance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds NOVA food classification groups, a 4-level ordinal scheme encoded as strings ('1' through '4'). Only 3 of the 4 possible groups appear across 50 rows, with group '4' (ultra-processed) dominating at 33/50 (top_rate 0.6875) and group '2' entirely absent. Null rate is 0.04 and entropy_ratio is 0.64, indicating concentration toward the ultra-processed end.","role":"feature","scope":"column","target":"nova_groups","treatment":"Treat as ordinal (cast to int) and impute the 4% missing before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labeled 'allergens_hierarchy', suggesting it holds hierarchical allergen tags (likely a list or delimited path structure). Saturn skipped profiling, so no uniqueness, cardinality, or value statistics are available beyond the fact that all 50 rows are non-null. 
Without parsed content, the structure and value distribution cannot be characterized.","role":"feature","scope":"column","target":"allergens_hierarchy","treatment":"Parse the hierarchy into a list, then one-hot or multi-label encode allergen tags before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The 'obsolete' column has a single observed value\u2014an empty string\u2014across all 44 non-null rows, with the remaining 12% of rows null. Cardinality is 1 and entropy is 0, so this column carries no information as-is. The name suggests a deprecated flag, consistent with it being effectively unused.","role":"metadata","scope":"column","target":"obsolete","treatment":"Drop; constant column with no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a source/origin indicator (likely Swedish, given the _sv suffix) but it carries virtually no information in this sample. With a 92% null rate and the only non-null value being an empty string repeated 4 times, cardinality is 1 and entropy is 0. The column is effectively constant and unusable as-is.","role":"metadata","scope":"column","target":"origin_sv","treatment":"Drop the column; it is 92% null and otherwise constant."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column packaging_hierarchy was skipped by the profiler, so no type, uniqueness, or distribution stats are available. All 50 rows are non-null, but every other signal (kind, n_unique, summary stats) is missing. 
Without further inspection the contents and structure remain unknown.","role":"other","scope":"column","target":"packaging_hierarchy","treatment":"Re-profile or manually inspect a sample before deciding on downstream handling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.q1","stats.q3","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a count of ingredients on a product whose declared percentage is unspecified, ranging from 1 to 33 with a mean of 8.8 and median of 7. The distribution is right-skewed (skew 1.64, kurtosis 3.55) with two outliers (4%) pulling the upper tail toward 33, well above the Q3 of 11. Every row has a value (null_rate 0, zero_rate 0), so no product in this sample fully discloses ingredient percentages.","role":"feature","scope":"column","target":"ingredients_with_unspecified_percent_n","treatment":"Apply a log or sqrt transform before modelling to tame the right skew."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","zero_rate","skew","kurtosis","max","mean","q3"],"model":"anthropic:claude-opus-4-7","narrative":"This is an estimated percentage of fruits, vegetables, and nuts per 100g of product. 
The signal is almost absent: 46% of rows are null, and of the 27 non-null values, 96.3% are zero, leaving essentially one non-zero observation at 85.0 that drives the mean of 3.15 and skew of 4.9.","role":"feature","scope":"column","target":"fruits-vegetables-nuts_100g_estimate","treatment":"Drop or collapse to a binary has_value flag; the column carries almost no variance."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","stats.cardinality","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Looks like a free-form certification/packaging code field (FSC-*, EMB *, LPL.*) with mixed formats including one company-name string. The column is dominated by empty strings \u2014 35 of 50 rows (top_rate 0.73) \u2014 and has a 4% null rate on top, leaving very little signal across 11 unique values. Entropy ratio of 0.50 and the long_tail alert confirm most non-empty codes appear only once or twice.","role":"metadata","scope":"column","target":"emb_codes","treatment":"Treat empty strings as missing and consider dropping or collapsing into a binary has_code flag given the sparsity and long tail."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","column"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics are available beyond a row count of 50 and a null rate of 0.0. The name 'packagings' suggests it likely holds nested or structured packaging descriptions (lists or objects), which is consistent with the profiler classifying its kind as 'unknown' and emitting a 'skipped' alert. 
Without unique counts or value summaries, nothing further can be inferred.","role":"other","scope":"column","target":"packagings","treatment":"Inspect raw values and parse/normalize the structure before deciding on a downstream treatment."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","n","null_rate","column"],"model":"anthropic:claude-opus-4-7","narrative":"Profiling skipped this column, so type, uniqueness, and value distribution are unknown. The only confirmed facts are 50 rows present with a null rate of 0.0 and a name suggesting a tags-style field for purchase locations. No further signal is available to characterise content or cardinality.","role":"other","scope":"column","target":"purchase_places_tags","treatment":"Re-run profiling with parsing enabled to inspect tag values before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'additives_original_tags' was skipped by the profiler, so no statistics, uniqueness count, or value samples are available beyond a row count of 50 and a null rate of 0.0. Based solely on the name, it likely holds lists of food-additive tag identifiers (e.g., E-numbers) in their original locale, but this cannot be verified from the evidence.","role":"other","scope":"column","target":"additives_original_tags","treatment":"Re-run the profiler with list/tag parsing enabled, then explode tags before encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Per-row URLs pointing to Open Food Foundation product front images, with locale suffixes like front_fr and front_en in the path. 
All 50 values are unique (entropy_ratio 1.0, top_rate 0.02) and there are no nulls, so this is effectively a 1:1 asset link rather than a feature.","role":"identifier","scope":"column","target":"image_front_url","treatment":"Treat as an asset URL: drop from modelling, or fetch images out-of-band for vision pipelines."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so its kind is unknown and no descriptive statistics are available beyond a row count of 50 and a null rate of 0. The name suggests it holds tags related to data-quality bugs, likely a list or delimited string, but that structure is not confirmed by evidence. Without uniqueness, value, or length signals, no distributional claims can be made.","role":"other","scope":"column","target":"data_quality_bugs_tags","treatment":"Re-run the profiler with parsing enabled (e.g., explode tags) before deciding how to use this column."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an origin field (likely the Finnish-language variant, given the 'fi' locale suffix) that is essentially empty. 90% of the 50 rows are null, and the remaining 5 non-null entries are all the empty string, giving a single unique value and zero entropy. There is no usable signal here.","role":"metadata","scope":"column","target":"origin_fi","treatment":"Drop; the column is 90% null and the remaining values are blank."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'images' was skipped by the profiler, so its kind is unknown and no descriptive statistics were computed. 
Only the row count (50) and a null rate of 0.0 are available; uniqueness, type, and value distribution are all missing. The name suggests binary or path-like image payloads, which would explain why the dissector bypassed it.","role":"other","scope":"column","target":"images","treatment":"Inspect raw values manually to confirm format, then route to an image-processing pipeline rather than tabular modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'ingredients_analysis' was skipped by the profiler, so no type, uniqueness, or distribution statistics are available. The only confirmed signals are 50 rows present and a 0.0 null rate. Without further inspection, its content and structure remain unknown.","role":"other","scope":"column","target":"ingredients_analysis","treatment":"Inspect raw values manually to determine type before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Polish-language ingredient text with embedded allergen HTML markup, almost entirely absent from this sample. 92% of 50 rows are null and only 3 distinct values appear, two of which are unique product descriptions and one is an empty string (top_rate 0.5 among non-nulls).","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_pl","treatment":"Drop for modelling given 92% nulls; if retained, strip HTML allergen tags and treat as free text."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"German-language product names, almost certainly the localized display label for food/confectionery items (chocolate, biscuits, Nutella). 
60% of rows are null and the top non-null value is an empty string occurring 5 times, so effectively only ~15 distinct names cover 50 rows. Entropy ratio of 0.935 confirms the populated values are nearly all unique, and at least one entry ('Lightly Sea Salted') is English rather than German.","role":"free_text","scope":"column","target":"product_name_de","treatment":"Treat as free text: normalize empty strings to null, then tokenize/embed if used as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Norwegian-language ingredients text field with allergen annotations, likely a localized variant of a product description column. It is effectively empty: 96% of rows are null and the only non-null value across the remaining 2 records is an empty string, giving a single unique value and zero entropy.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_nb","treatment":"Drop; the column carries no information at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_rate","top_value","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"Italian-language packaging description text, almost entirely absent from this sample. 68% of rows are null and of the 16 non-null entries, 14 are empty strings, leaving only 2 substantive Italian descriptions of recycling instructions. 
With cardinality of 3 and a top_rate of 0.875 on the empty string, this column carries virtually no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_it","treatment":"Drop unless joined with a much larger Italian-locale slice; too sparse to model."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Italian-language product name field, mostly empty: 68% of the 50 rows are null and the modal non-null value is the empty string \"\" (5 occurrences, top_rate 0.3125). Among the 12 distinct values the names are heterogeneous chocolate and snack labels (e.g. \"Fondente Prodigioso 90% Cacao\", \"Pringles classiche 175 gr\", \"Milka\"), with case-variant duplicates like \"cioccolato fondente\" vs \"Cioccolato fondente\" inflating cardinality. Entropy ratio 0.913 confirms the non-null tail is essentially flat, each name appearing once.","role":"free_text","scope":"column","target":"product_name_it","treatment":"Normalise case/whitespace, treat empty strings as null, then tokenize and embed; not usable as a categorical feature given 68% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric serving sizes stored as strings, with 27 distinct values across 50 rows and a 12% null rate. 
The distribution is long-tailed: top values \"100\" and \"10\" each cover only 7 records (top_rate 0.159), entropy_ratio is 0.909 indicating values are spread almost uniformly, and outliers like \"1000\" and decimals like \"11.5\" sit alongside round numbers.","role":"feature","scope":"column","target":"serving_quantity","treatment":"Cast to numeric, impute the 12% nulls, and consider log-transforming before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Japanese product name field that is effectively empty in this sample: 98% of the 50 rows are null and the single non-null value is itself the empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here whatsoever.","role":"metadata","scope":"column","target":"product_name_ja","treatment":"Drop the column; it is 98% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_values","stats.top_rate","stats.entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"Swedish-language ingredient lists with embedded HTML allergen markup (<span class=\"allergen\">\u2026</span>), likely the Swedish localisation of a product ingredients field. Coverage is extremely poor: 92% null and only 4 distinct values across 50 rows, with the top value appearing just once (top_rate 0.25 over the non-null subset). 
One value is an empty string and others mix Swedish with Danish/Norwegian terms (HVEDEMEL, BYG, EGG), indicating inconsistent locale handling.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_sv","treatment":"Strip HTML tags and parse allergen spans separately; given 92% nulls, do not use as a primary feature."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column `allergens_tags` was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests a multi-valued tag field listing allergens (e.g., milk, nuts), but this cannot be verified from the evidence. Re-profile with list/string handling enabled to learn cardinality and tag distribution.","role":"feature","scope":"column","target":"allergens_tags","treatment":"Re-profile with tag-aware parsing, then one-hot or multi-hot encode the individual allergen tokens."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is the French-language ingredients list for food products, stored as free-form text. Of 50 rows, 47 are unique and entropy ratio is 0.998, so values are essentially all distinct long strings; 4% are null and the most common value is an empty string (2 occurrences). 
Contents range from a two-word 'Eau de source' to multi-sentence ingredient declarations with percentages, allergens and additive codes.","role":"free_text","scope":"column","target":"ingredients_text_fr","treatment":"Tokenize and embed (or extract structured ingredient/allergen features) rather than treating as a category."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","min","max","zero_rate","skew","kurtosis","n_outliers","std"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a beverage-specific nutrition score, encoded as a numeric flag rather than a continuous metric: only 2 unique values across 50 rows, with min 0 and max 1. The distribution is overwhelmingly zero (zero_rate 0.98), leaving a single outlier at 1 that drives the extreme skew (6.86) and kurtosis (45.02). Effectively a near-constant indicator column.","role":"feature","scope":"column","target":"nutrition_score_beverage","treatment":"Treat as a binary flag, or drop as near-constant since 98% of rows share one value."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics beyond row count (50) and null rate (0.0) are available. The name suggests it holds debug-only ingredient identifiers, likely a complex or nested structure that the dissector could not categorize. 
Without unique counts or value samples, its content and utility cannot be assessed here.","role":"other","scope":"column","target":"ingredients_ids_debug","treatment":"Drop unless a downstream consumer specifically needs the raw debug payload."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a flag indicating whether nutrition data is present, with the only observed value being \"on\" across all 49 non-null rows. Cardinality is 1 and entropy is 0, so the column carries no discriminative information; one row (2%) is null.","role":"metadata","scope":"column","target":"nutrition_data","treatment":"Drop, constant column with no variance."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Japanese-language origin field, likely a localized counterpart to a primary origin column. It is effectively empty: 98% of the 50 rows are null and the only non-null value is itself the empty string, yielding a single unique value and zero entropy.","role":"metadata","scope":"column","target":"origin_ja","treatment":"Drop; the column carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"English-language packaging descriptions, likely free-text recycling instructions scraped from product labels. Of 50 rows, 14% are null and another 39 (top_rate 0.91) are empty strings, leaving only 4 rows with actual content across 5 unique values. 
Entropy ratio of 0.27 confirms the column is almost entirely uninformative as-is.","role":"free_text","scope":"column","target":"packaging_text_en","treatment":"Drop or defer; coverage is too sparse to model, but if retained treat empty strings as nulls and tokenize the remainder."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.zero_rate","stats.mean","stats.median","stats.q1","stats.q3","stats.max","stats.min","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","stats.std"],"model":"anthropic:claude-opus-4-7","narrative":"This is a count of unrecognised ingredients per row, ranging from 0 to 13 with a mean of 0.66. The distribution is dominated by zeros (zero_rate 0.84) with median, q1, and q3 all at 0, but a long right tail produces extreme skew (4.24) and kurtosis (18.32), with 8 outliers (16%) pulling the max to 13. Effectively a sparse anomaly indicator rather than a continuous count.","role":"feature","scope":"column","target":"unknown_ingredients_n","treatment":"Binarise (zero vs non-zero) or cap before modelling; raw values are too skewed for linear models."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column, named ingredients_from_palm_oil_tags, was skipped by the profiler so no distribution, uniqueness, or value-level statistics are available. 
The only confirmed signals are 50 rows and a 0.0 null rate; everything else (kind, n_unique) is missing.","role":"other","scope":"column","target":"ingredients_from_palm_oil_tags","treatment":"Re-profile with type coercion before deciding; likely a list/tag field needing parsing and one-hot or multi-label encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `labels_tags` was skipped by the profiler, so its kind, cardinality, and value distribution are all unknown. The only confirmed facts are that it contains 50 rows with no nulls. The name suggests a labels or tags field, likely multi-valued or delimited text, but no evidence confirms that.","role":"other","scope":"column","target":"labels_tags","treatment":"Re-profile with a parser that handles list/tag-style values before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Pre-taxonomy packaging descriptions captured as free text, mixing languages (French, Spanish, English, German) and multi-value comma-separated lists. With 36 unique values across 38 non-null rows and entropy ratio 0.99, the field is almost fully unique; even the top value 'plastique' covers only 7.9% and 24% are null. 
Values combine material terms, language prefixes like 'fr:'/'en:', and counts ('20 biscuits en 4 sachets'), so it behaves more like free text than a category.","role":"free_text","scope":"column","target":"packaging_old_before_taxonomization","treatment":"Normalise and split on commas, then map tokens to a controlled packaging taxonomy before use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Norwegian Bokm\u00e5l packaging text field, but it is effectively empty: 96% of 50 rows are null and the only 2 non-null values are blank strings, yielding cardinality 1 and entropy 0.","role":"free_text","scope":"column","target":"packaging_text_nb","treatment":"Drop; the column carries no information."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics beyond a 50-row count and zero null rate are available. The name nutrition_grades_tags suggests categorical tags (likely Nutri-Score letters such as a-e) from an Open Food Facts-style source, but uniqueness, frequencies, and value examples are all missing. Treat any interpretation as provisional until the column is reprofiled.","role":"other","scope":"column","target":"nutrition_grades_tags","treatment":"Reprofile with categorical parsing enabled before deciding on encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no type, uniqueness, or distribution stats were computed beyond a 50-row count and 0% null rate. 
The name 'category_properties' suggests it holds nested or structured per-category attributes (likely dict/list/JSON), which is why saturn flagged it as unknown rather than a scalar kind.","role":"other","scope":"column","target":"category_properties","treatment":"Inspect raw values and, if structured, flatten or JSON-normalize into separate columns before profiling again."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.std","stats.skew","stats.kurtosis","stats.zero_rate","stats.n_outliers","stats.q1","stats.q3"],"model":"anthropic:claude-opus-4-7","narrative":"This is the Nutri-Score numeric grade (typically -15 best to 40 worst), here ranging 0 to 40 with a mean of 17.47 and median of 19. The distribution is roughly symmetric (skew -0.16, kurtosis -0.53) with no outliers flagged, and 8.2% of values are exactly zero. Only 2% are null and 28 unique values across 50 rows, so the column is well populated and reasonably varied.","role":"feature","scope":"column","target":"nutriscore_score","treatment":"Use directly as a numeric feature; impute the 2% nulls with the median."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'packaging_tags' was skipped by the profiler, so no type, uniqueness, or distributional statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds packaging-related tags, likely a multi-valued or list-like field that the profiler could not classify. 
Without parsed values we cannot confirm cardinality, delimiter, or language.","role":"other","scope":"column","target":"packaging_tags","treatment":"Re-profile after parsing the tag list (e.g., split on delimiter) before deciding on encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Legacy multi-label tags for products, stored as comma-separated strings mixing French, English, Polish, Bulgarian (Cyrillic), and namespaced codes like 'en:CE'. With 38 uniques across 50 rows, an 8% null rate, and the most common value being the empty string at 19.6%, the field is sparse and nearly free-form. Entropy ratio 0.93 and the long_tail alert confirm almost every non-empty value is singleton.","role":"free_text","scope":"column","target":"labels_old","treatment":"Split on commas, normalise language/namespace prefixes, and one-hot the resulting tag tokens rather than treating the raw string as a category."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text packaging descriptions, mostly in French with some English mixed in, detailing materials and recycling instructions. The dominant value is an empty string at 75% (36 of 50 rows), and only 13 unique values exist with entropy ratio 0.46, so signal is sparse and long-tailed. 
Among non-empty entries, formats vary widely (multi-line itemized lists, comma-separated tags, uppercase marketing strings), suggesting no controlled vocabulary.","role":"free_text","scope":"column","target":"packaging_text","treatment":"Normalise case/whitespace and parse material keywords into multi-hot features; treat empty string as missing."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","min","max","mean","median","q1","q3","iqr","skew","kurtosis","n_outliers","outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a binary status flag for ingredient percent analysis, taking only 2 unique values (1.0 and -1.0) across 50 rows with no nulls. The distribution is heavily dominated by 1.0 (median, q1, q3 all 1.0; mean 0.84), with 4 outliers (8%) at -1.0 producing extreme negative skew (-3.10) and high kurtosis (7.59). Despite the numeric kind, the IQR of 0 and only two unique values indicate this is categorical rather than continuous.","role":"feature","scope":"column","target":"ingredients_percent_analysis","treatment":"Recode as a categorical/boolean flag rather than treating as continuous numeric."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'ecoscore_data' was skipped by the profiler, so no type, uniqueness, or distribution stats are available. Only the row count (50) and a null rate of 0.0 are reported. 
The name suggests it holds Eco-Score payloads, likely a nested/structured object that the profiler could not introspect.","role":"other","scope":"column","target":"ecoscore_data","treatment":"Inspect raw values and parse the nested structure into typed sub-fields before use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Swedish-language ingredient lists for food products, free-text rather than truly categorical. Coverage is extremely sparse: 92% null with only 4 distinct values across 50 rows, one of which is an empty string. The non-empty entries are full ingredient declarations including allergen markers and mixed Swedish/Danish/Norwegian terms.","role":"free_text","scope":"column","target":"ingredients_text_sv","treatment":"Treat as free text; given 92% nulls, drop or use only as a fallback to other-language ingredient columns."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'brands_tags' was skipped by the profiler, so no type, uniqueness, or distribution statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds brand tag strings (likely slug-style identifiers, possibly multi-valued), but this cannot be confirmed from the evidence. 
Treat any downstream assumption with caution until the column is re-profiled.","role":"other","scope":"column","target":"brands_tags","treatment":"Re-profile or sample the raw values before deciding; if multi-valued tag strings, split and one-hot or embed."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Holds an Open Food Facts category taxonomy code (e.g., 'en:dark-chocolate-bar-with-more-than-70-cocoa') used as a comparison reference. With 35 unique values across 50 rows and entropy ratio 0.95, the column is extremely diffuse \u2014 the modal category covers only 10% of rows and a long tail dominates. No nulls, but the high cardinality relative to sample size will make this hard to use as-is.","role":"metadata","scope":"column","target":"compared_to_category","treatment":"Roll up to a coarser taxonomy level (e.g., chocolate/biscuits/dairy) before any grouping or modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the set of apps/databases that contributed each product's data, stored as a comma-separated list rather than a normalized relation. With 43 unique strings across 50 rows (entropy ratio 0.98) and the most common combination appearing only 4 times (top_rate 0.08), nearly every row has a bespoke source bundle. 
Notable: the values mix case ('yuka' vs 'Yuka') and overlap heavily on 'App - smoothie-openfoodfacts' and 'Apps', suggesting the same sources are repeatedly concatenated in different orders.","role":"metadata","scope":"column","target":"data_sources","treatment":"Split on commas, normalize case, and one-hot encode individual sources instead of treating the raw string as a category."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column, `other_nutritional_substances_prev_tags`, was skipped by the profiler, so no statistics on uniqueness, distribution, or content are available. The only signals are that all 50 rows are non-null and the kind is unknown. Without further evidence the contents cannot be characterised; the name suggests a tag list referencing prior values of a nutritional-substances field.","role":"other","scope":"column","target":"other_nutritional_substances_prev_tags","treatment":"Re-profile with parsing enabled (likely a delimited tag list) before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","stats.min","stats.max","stats.mean","stats.zero_rate","stats.iqr","stats.n_outliers","null_rate","stats.skew"],"model":"anthropic:claude-opus-4-7","narrative":"This is effectively a binary indicator counting palm-oil-derived ingredients per product, stored as numeric with values only 0 or 1 (n_unique=2, max=1.0). The column is heavily zero-dominated (zero_rate \u2248 0.85) with mean \u2248 0.152, and the 7 ones get flagged as outliers because the IQR is 0. 
Null rate is 8%, modest but worth noting.","role":"feature","scope":"column","target":"ingredients_from_palm_oil_n","treatment":"Recast as a boolean palm-oil flag and impute the 8% nulls before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.iqr","stats.outlier_rate","stats.n_outliers","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Values are unique 10-digit integers in the ~1.74e9\u20131.77e9 range, which is the Unix-epoch band for early 2025 through late 2025, consistent with the column name suggesting a 'last updated' timestamp. The distribution is heavily left-skewed (skew -1.94) with 12% flagged as outliers \u2014 a handful of much older updates pulling the tail down while most rows cluster within a ~6.1M-second IQR (~71 days). No nulls or zeros.","role":"timestamp","scope":"column","target":"last_updated_t","treatment":"Cast from Unix seconds to datetime and derive recency features rather than using the raw integer."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This looks like a debug/diagnostic field for a nutrition scoring pipeline, capturing which input nutrients were missing during computation. It is overwhelmingly empty: 49 of 50 rows (top_rate 0.98) hold an empty string, with only one row carrying a substantive message about missing saturated-fat, sugars, and sodium. 
Entropy of 0.14 confirms near-zero information content in this sample.","role":"metadata","scope":"column","target":"nutrition_score_debug","treatment":"Drop from modelling; retain only for pipeline debugging."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.median","stats.iqr","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Values cluster tightly between 23.999B and 24.000B with an IQR of only ~400K, yet the minimum drops to ~22.9999B, producing severe negative skew (-2.67) and 5 low-side outliers (10%). With 49 unique values across 50 rows and no nulls, this looks like an opaque high-magnitude key or encoded rank rather than a true numeric measure.","role":"identifier","scope":"column","target":"popularity_key","treatment":"Treat as an identifier and exclude from numeric modelling; join on it if it links to another table."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Spanish-language product names, evidently a localized label field paralleling a primary product identifier. With null_rate 0.6 and 4 of the 20 non-null entries being empty strings, only ~16 rows carry usable text; among those, near-uniqueness is extreme (17 distinct values, entropy_ratio 0.96). 
Values mix branded items (Nutella Biscuits, Excellence 85% cacao) with generic descriptors (Original, Chocolate negro 85% cacao), so it behaves more like free text than a controlled vocabulary.","role":"free_text","scope":"column","target":"product_name_es","treatment":"Treat empty strings as nulls and tokenize/embed if used as a feature; otherwise drop given 60% missingness and high cardinality."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"User-submitted allergen tags prefixed with a language code like (fr), (en), (es). There are 34 distinct values across 50 rows with a high entropy ratio of 0.91, and the top value '(fr) ' (rate 0.16) is just an empty language tag, as is '(en) ' at 7 occurrences. Values mix languages and free-form casing (e.g. 'Gluten,Lait,Soja, en:gluten' alongside normalised 'en:gluten'), so the same allergen appears under multiple spellings.","role":"free_text","scope":"column","target":"allergens_from_user","treatment":"Strip the language prefix, split on commas, and normalise tokens to the en: namespace before using as multi-label features."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'informers' was skipped by the profiler, so its kind is unknown and no descriptive statistics were computed. 
The only confirmed signals are 50 rows with no nulls; uniqueness, type, and value distribution are all missing from the evidence.","role":"other","scope":"column","target":"informers","treatment":"Re-profile or manually inspect the raw values before deciding on any downstream handling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This is a legacy brand-name field for product records, with 29 distinct values across 50 rows and 32% nulls. The distribution is nearly flat (entropy_ratio 0.98) and the top brand 'Gerbl\u00e9' covers only ~8.8% of non-null rows, so no brand dominates. Values mix clean names (Lindt, Cristaline) with concatenations like 'Wasa,Barilla' and oddities like 'LuMondelez', suggesting prior data-entry or merge artefacts.","role":"metadata","scope":"column","target":"brands_old","treatment":"Clean and split multi-brand strings, then reconcile against a canonical brand list before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"Profiling was skipped for this column, so no type, uniqueness, or value statistics are available. The only confirmed signals are 50 rows and a 0.0 null rate; everything else is missing. The name suggests it carries tags describing data-quality errors, likely a list or delimited string, but that is not verified by evidence.","role":"other","scope":"column","target":"data_quality_errors_tags","treatment":"Re-run profiling with list/string parsing enabled before deciding how to use it."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text ingredient lists from food packaging, one per row. 
Every one of the 50 rows is unique (entropy_ratio 1.0, top_rate 0.02) and the samples mix multiple languages (English, French, Bulgarian Cyrillic) with punctuation, percentages, and allergen notes. Treating this as a categorical feature is misleading despite the kind tag \u2014 it is unstructured multilingual prose flagged long_tail.","role":"free_text","scope":"column","target":"ingredients_text","treatment":"Parse and tokenize (language-detect first), then embed or extract ingredient entities before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Open Food Facts-style hierarchical category breadcrumbs, with each value a comma-separated taxonomy path from broad ('Snacks') to specific ('Chocolat noir en tablette extra d\u00e9gustation \u00e0 70% de cacao minimum'). It is nearly unique (46 distinct values across 50 rows, top_rate just 0.06, entropy_ratio 0.99) and mixes French and English labels for overlapping concepts (e.g. 'Snacks sucr\u00e9s' vs 'Sweet snacks', 'Chocolats noirs' vs 'Dark chocolates'), which the long_tail alert flags. Treat as a multi-label taxonomy rather than a flat category.","role":"feature","scope":"column","target":"categories","treatment":"Split on commas, normalize French/English synonyms, and one-hot or embed the resulting taxonomy tags rather than using the raw string."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.zero_rate","stats.median","stats.q3","stats.max","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an estimated percentage of fruits/vegetables/nuts content derived from ingredients, used in nutrition score warnings. 
The distribution is dominated by zeros (zero_rate 0.71) with median 0.0 and Q3 only 2.33, yet a long tail pushes max to 100.0, producing extreme skew (5.41) and kurtosis (30.37). Seven outliers (15.6%) and a 10% null rate further indicate this signal fires for only a small subset of products.","role":"feature","scope":"column","target":"nutrition_score_warning_fruits_vegetables_nuts_estimate_from_ingredients_value","treatment":"Binarize (zero vs non-zero) or log1p-transform before modelling given the heavy zero mass and skew."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","zero_rate","skew","null_rate","mean"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a count of ingredients sourced from or potentially from palm oil per product. With only 3 unique values ranging 0\u20132 and 70.2% zeros, most products contain none, while the right skew (1.39) reflects a small tail with one or two such ingredients. Null rate is modest at 6%.","role":"feature","scope":"column","target":"ingredients_from_or_that_may_be_from_palm_oil_n","treatment":"Treat as a low-cardinality ordinal count; impute missing as 0 or add a missing flag before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Legacy free-text origin field, likely superseded (note the `_old` suffix). Of 50 rows, 22% are null and another 31 are empty strings, so the top_rate of 0.795 is dominated by blanks; only 9 distinct values exist and the non-empty entries mix country names ('France', 'Morocco'), multi-region comma lists, and noise like 'biologique' or 'Farine de bl\u00e9: France'. 
Entropy ratio 0.425 confirms most signal is absent, and the inconsistent formats mean this cannot be used as a clean categorical without parsing.","role":"metadata","scope":"column","target":"origins_old","treatment":"Drop or archive; if needed, parse non-empty strings into a normalised origins list and prefer the replacement column."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Dutch-language packaging text field (likely from Open Food Facts or similar). 76% of the 50 rows are null, and every one of the 12 non-null values is the empty string, giving cardinality 1 and entropy 0. The column carries no usable signal in this sample.","role":"free_text","scope":"column","target":"packaging_text_nl","treatment":"Drop; column is effectively empty (null or blank in all rows)."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is an expiration_date field captured as free-form text rather than a parsed date. 
With 34 unique values across 50 rows and a top_rate of 0.3125 driven by an empty string, roughly 31% of entries are blank (plus a 4% null_rate), and the remaining values mix incompatible formats like '31/07/2020', '28/02/24', '25.11.2025', '01/2018', '19-10-2023', and even non-date tokens like '30days'.","role":"metadata","scope":"column","target":"expiration_date","treatment":"Normalise to ISO dates with multi-format parsing and treat blanks/'30days' as missing before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'selected_images' was skipped by the profiler, so no type, cardinality, or distribution stats are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds image references or selections (filenames, URLs, or arrays), but this cannot be confirmed from the evidence. Without n_unique or value samples, no further characterisation is possible.","role":"other","scope":"column","target":"selected_images","treatment":"Inspect raw values manually to determine structure before deciding on parsing, exploding, or dropping."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Allergen trace declarations parsed from product ingredient lists, recorded as free-form comma-separated allergen names. 
78% of the 50 rows (39) are empty strings rather than nulls, and the remaining 11 distinct values mix languages (French '\u0153uf', 'lait', English 'nuts, milk', German 'Schalenfr\u00fcchte') and inconsistent casing, with some entries duplicating the same allergens twice in one string.","role":"free_text","scope":"column","target":"traces_from_ingredients","treatment":"Normalise case, split on commas, translate to a canonical allergen vocabulary, and treat empty strings as missing before one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text ingredient lists with embedded HTML <span class=\"allergen\"> markup highlighting allergens. All 50 rows are unique (entropy_ratio 1.0, top_rate 0.02) and the language mix spans English, French, and Bulgarian Cyrillic, so any naive categorical encoding will explode. The HTML tags and multilingual content mean raw values need cleaning before NLP use.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens","treatment":"Strip HTML tags, language-detect, then tokenize/embed; do not treat as a category."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Open Food Facts thumbnail URLs pointing to product front images, embedding the product barcode and a language suffix (front_fr/front_en) in the path. Every one of the 50 rows is unique with zero nulls, so it functions as a per-row identifier rather than a feature. 
The mix of fr and en suffixes hints at a multi-locale product set.","role":"identifier","scope":"column","target":"image_front_thumb_url","treatment":"Drop for modelling; retain as a media link or fetch images if vision features are needed."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a low-cardinality categorical with 5 distinct values that look like ISO 639-1 language codes (fr, en, de, bg, ro), suggesting a language tag for each row. The distribution is heavily concentrated: 'fr' accounts for 35 of 50 rows (top_rate 0.70), 'en' for 10, while 'de', 'bg', and 'ro' appear only 1-3 times. Entropy ratio of 0.56 confirms the imbalance, and there are no nulls.","role":"feature","scope":"column","target":"lc","treatment":"One-hot encode, or group rare codes (bg, ro, de) into an 'other' bucket before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text ingredient lists in French (e.g., 'Lait \u00e9cr\u00e9m\u00e9, cr\u00e8me, sucre...'), likely a debug dump of OpenFoodFacts-style product compositions. Near-maximal entropy (0.997) and 35 unique values out of 50 confirm essentially every non-null row is distinct, while 28% are null and the top value is an empty string appearing twice. 
Texts vary wildly in length and include allergen markup (_lait_, _soja_) plus stray non-ingredient prose like publication dates.","role":"free_text","scope":"column","target":"ingredients_text_debug","treatment":"Tokenize and embed (or parse into structured allergen/ingredient lists) after imputing empty strings as nulls."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a low-cardinality categorical tagging the dominant packaging material, with only 3 distinct values across 50 rows ('en:paper-or-cardboard', 'en:plastic', 'en:unknown'). The headline issue is a 62% null rate, leaving just 19 observed rows where 'en:paper-or-cardboard' alone covers 68.4%. Entropy ratio of 0.70 indicates moderate concentration among the few non-null entries.","role":"feature","scope":"column","target":"packagings_materials_main","treatment":"Impute missing as an explicit 'unknown' category before one-hot encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `data_quality_dimensions` was skipped by the profiler, so no type, uniqueness, or value statistics were computed beyond a row count of 50 and a null rate of 0.0. Without `n_unique` or any descriptive stats, its content and structure are unknown from this evidence alone. 
The name suggests it may hold structured or list-like quality metadata, but that cannot be confirmed here.","role":"other","scope":"column","target":"data_quality_dimensions","treatment":"Re-profile with type inference forced, or inspect raw values manually before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text serving size descriptors, with 37 unique values across only 50 rows (entropy ratio 0.98) and a 12% null rate. The top value '100g' covers just 6.8% of rows, and inconsistent formatting is rampant \u2014 '100g' vs '100 g', '10 g' vs '20g', plus compound strings like '1 Square (10 g)' \u2014 so the same physical quantity appears under multiple labels.","role":"feature","scope":"column","target":"serving_size","treatment":"Parse into a numeric grams column via regex and unit normalization before use."},{"confidence":"low","critiques":[],"evidence_keys":["column","kind","n","null_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named pnns_groups_1_tags, suggesting it holds Programme National Nutrition Sant\u00e9 top-level group tags (likely a categorical food classification). Saturn skipped profiling, so no uniqueness, frequency, or value statistics are available beyond n=50 and a 0.0 null rate. 
Without distribution evidence, the cardinality and dominant categories cannot be confirmed.","role":"metadata","scope":"column","target":"pnns_groups_1_tags","treatment":"Re-profile or inspect manually before use; if categorical, encode as a low-cardinality factor."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text origin/provenance field, likely scraped from product packaging in mixed French/German wording. The column is almost entirely empty: the blank string accounts for 42 of 50 rows (top_rate 0.894) and another 6% are null, leaving only 5 distinct populated values. Entropy ratio of 0.285 and the long_tail alert confirm there is essentially no usable signal as-is.","role":"free_text","scope":"column","target":"origin","treatment":"Drop or parse with regex/NER to extract country tokens; too sparse to use directly."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a language code for ingredient text, with only 4 distinct values across 50 rows. French dominates at 70% (35 rows), followed by English (11), with Bulgarian and German trailing at 2 each. 
The skew is heavy and the entropy ratio of 0.606 confirms concentration around a single language.","role":"metadata","scope":"column","target":"ingredients_lc","treatment":"One-hot encode or use as a filter; consider grouping rare languages into 'other'."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-form packaging descriptions, almost certainly from an Open Food Facts-style export, mixing French and English tokens plus language-prefixed tags (e.g. 'fr:Triman', 'en:Bottle'). With 40 unique values across 50 rows and entropy_ratio 0.99, it's near-unique; the top value 'Plastique' covers only 6.98% and 14% are null. Entries are comma-separated multi-tags of varying granularity, so this behaves more like a tag list than a clean category.","role":"free_text","scope":"column","target":"packaging_old","treatment":"Split on commas, normalise language prefixes, and one-hot the resulting tag set rather than treating raw strings as categories."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text French packaging instructions, mostly empty: 34 of 50 rows (top_rate 0.723) are blank and another 6% are null. Of 14 distinct values, the populated ones are heterogeneous descriptions of materials and recycling instructions (plastic films, cardboard \u00e9tuis, aluminium sheets), with one outlier containing OCR-like artefacts and a date string. 
Entropy ratio 0.49 confirms the long-tail alert: almost every non-empty entry is unique.","role":"free_text","scope":"column","target":"packaging_text_fr","treatment":"Treat blanks as missing and parse remaining strings for material/recyclability tokens rather than using as a categorical."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical debug/diagnostic field, presumably trace messages from a NOVA food-group classifier. It's overwhelmingly empty (96% blank, 48 of 50 rows), with only two non-empty entries \u2014 both error strings explaining that NOVA classification was skipped due to unknown ingredients. Entropy ratio of 0.178 confirms near-zero information content.","role":"metadata","scope":"column","target":"nova_group_debug","treatment":"Drop; near-constant debug log with no modelling value."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `ingredients_original_tags` was skipped by the profiler, so no statistics, uniqueness, or value samples are available beyond a row count of 50 and a null rate of 0.0. The name suggests a list-valued field of ingredient tags (likely arrays or delimited strings), which is consistent with the profiler classifying it as `unknown` and bailing out. 
Without type or cardinality signals, nothing further can be inferred from the evidence.","role":"free_text","scope":"column","target":"ingredients_original_tags","treatment":"Parse the list/array structure and explode or multi-hot encode before downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named data_quality_completeness_tags but saturn skipped profiling it, so its kind is unknown and no uniqueness or value statistics were computed. The only confirmed signals are that it has 50 rows with a null rate of 0.0. Without sample values or cardinality, its actual content (likely tag strings about completeness checks) cannot be verified from the evidence.","role":"other","scope":"column","target":"data_quality_completeness_tags","treatment":"Re-profile with explicit parsing before deciding how to use it downstream."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","n","null_rate","kind","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"The column `cities_tags` was skipped by the profiler, so no type inference, uniqueness count, or value statistics are available. Only two facts are known: 50 rows were seen and none were null. Without further stats the content and structure cannot be characterised.","role":"other","scope":"column","target":"cities_tags","treatment":"Re-profile or inspect raw values manually before deciding on downstream use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column `countries_hierarchy` was skipped by the profiler, so no kind, uniqueness, or value statistics are available beyond a row count of 50 with zero nulls. The name suggests a nested or list-like representation of country tags (e.g., `en:france > en:europe`), which likely tripped the type detector. 
Treat the absence of stats as a signal that the values are non-scalar rather than missing.","role":"feature","scope":"column","target":"countries_hierarchy","treatment":"Parse the hierarchical strings into a list of country tags, then explode or one-hot encode before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["min","max","mean","median","q1","q3","iqr","skew","kurtosis","n_outliers","null_rate","zero_rate","n_unique","n","std"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric column holding the negation of a Nutri-Score (range -40 to 0, median -19), so lower values correspond to better nutritional grades. Distribution is roughly symmetric (skew 0.16, kurtosis -0.53) with no outliers and a tight IQR of 15. Notable signals: 2% nulls, 8% zeros, and only 28 unique values across 50 rows, consistent with an integer score derived by sign-flipping the original Nutri-Score.","role":"feature","scope":"column","target":"nutriscore_score_opposite","treatment":"Use as-is for modelling, or invert the sign back to the original Nutri-Score for interpretability."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `categories_properties_tags` was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests a nested or multi-valued field (categories/properties/tags), which likely tripped the dissector's scalar assumptions. 
Without distinct-value or sample evidence, its actual content and cardinality are unknown.","role":"other","scope":"column","target":"categories_properties_tags","treatment":"Re-profile after flattening or JSON-parsing this field before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a lowercase language/origin code with 6 distinct values across 50 rows and a 4% null rate. The distribution is dominated by 'fr' (23) and 'en' (20), together accounting for nearly all non-null entries, while 'es', 'de', 'it', and 'pl' appear only once or twice each. Entropy ratio of 0.61 confirms the heavy concentration in two categories.","role":"feature","scope":"column","target":"origins_lc","treatment":"One-hot encode with rare categories (es/de/it/pl) collapsed into an 'other' bucket."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column, ciqual_food_name_tags, was skipped by the profiler so no distributional statistics are available. The only confirmed signals are 50 rows present and a null rate of 0.0; uniqueness, value samples, and type are all missing. 
Based on the name alone it likely holds CIQUAL food-name tag strings, but that cannot be verified from the evidence.","role":"other","scope":"column","target":"ciqual_food_name_tags","treatment":"Re-run the profiler on this column to recover type and cardinality before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text country list per record, not a clean categorical: 43 unique values across 50 rows (entropy ratio 0.97) with the top value 'Maroc' at only 10%. Values mix languages (Maroc vs Morocco, Belgique vs Belgium), comma-separated multi-country strings, and even an 'en:switzerland' prefix, so the same country appears in several surface forms. The 'long_tail' alert is consistent with this near-unique, multi-label encoding.","role":"free_text","scope":"column","target":"countries","treatment":"Split on commas, normalise language and prefixes to ISO country codes, then one-hot or multi-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Italian-language ingredient lists with embedded HTML <span class=\"allergen\"> markup, one row per product. Coverage is poor: 68% of the 50 rows are null and the most common non-null value is the empty string (5 occurrences, 31% of present values), leaving only a handful of genuine ingredient strings. Among the 12 distinct values, contents range from short lists (e.g. 
\"patate, olio di girasole, sale marino.\") to long compound declarations, so length and structure vary widely.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_it","treatment":"Strip HTML allergen tags, treat empty strings as null, then tokenize for NLP or extract allergen flags as features."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be the language code of packaging text, with 7 distinct ISO-style codes across 50 rows. French and English tie at 17 occurrences each, though the reported top_rate of 0.386 reflects only one being chosen as top_value ('fr'); German trails at 5, with Portuguese, Italian, Spanish, and Croatian as singletons. A 12% null rate and entropy ratio of 0.71 indicate moderate diversity but a clear FR/EN dominance.","role":"metadata","scope":"column","target":"packaging_lc","treatment":"Treat as a low-cardinality categorical; impute nulls and one-hot encode, optionally collapsing rare codes into 'other'."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `correctors_tags` was skipped by the profiler, so no type, uniqueness, or distributional statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds tags identifying correctors, plausibly a list- or set-valued field that the dissector could not coerce into a known kind. 
Without further stats, nothing can be said about cardinality, value mix, or skew.","role":"other","scope":"column","target":"correctors_tags","treatment":"Re-profile after parsing into a primitive type (e.g., explode tags into strings) before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to record the interface version in use when each record was created, encoded as a date-stamp with optional jQuery Mobile suffix. Only 3 distinct values appear across 50 rows, with '20120622' dominating at 59.2% and a long-tail '20130323.jqm' appearing just twice. Entropy ratio of 0.74 confirms moderate concentration, and there is a 2% null rate to account for.","role":"metadata","scope":"column","target":"interface_version_created","treatment":"Treat as a low-cardinality categorical; one-hot encode or bucket the rare '20130323.jqm' level."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics beyond row count (50) and a 0.0 null rate are available. The name suggests it holds tag-like state markers, possibly multi-valued, but kind is reported as unknown and uniqueness is not measured. 
Without sampled values or cardinality, its content and structure cannot be characterised from the evidence.","role":"other","scope":"column","target":"states_tags","treatment":"Re-profile with parsing enabled (likely a delimited tag list) before deciding whether to one-hot or drop."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labelled nutriscore_2021_tags, suggesting Nutri-Score grade tags from a 2021 reference (typically values like a/b/c/d/e). Saturn skipped profiling, so no distribution, uniqueness, or value statistics are available beyond a row count of 50 and a 0.0 null rate. No further signal can be extracted without re-profiling.","role":"feature","scope":"column","target":"nutriscore_2021_tags","treatment":"Re-profile or inspect manually; if confirmed categorical, treat as an ordinal Nutri-Score grade."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests a multi-valued tag field associated with stores (likely a list or delimited string), but this cannot be confirmed from the evidence.","role":"other","scope":"column","target":"stores_tags","treatment":"Re-profile after parsing as a list/array to determine cardinality and tag distribution before use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds Open Food Facts product thumbnail URLs, one per row. Every one of the 50 values is unique (entropy_ratio 1.0, top_rate 0.02), so it acts as a per-row asset pointer rather than a categorical feature. 
URLs mix `front_fr` and `front_en` locale suffixes, hinting at a French/English product mix.","role":"metadata","scope":"column","target":"image_thumb_url","treatment":"Drop for modelling; retain only as a display link or for image-fetching pipelines."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so its type, cardinality, and value distribution are unknown beyond a count of 50 rows with no nulls. The name `categories_properties` suggests a nested or structured field (e.g., a list or dict of category attributes) that the profiler could not coerce into a scalar kind. Without parsed contents there is nothing further to infer.","role":"other","scope":"column","target":"categories_properties","treatment":"Inspect raw values and parse the nested structure (explode or flatten) before profiling again."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"Saturn skipped profiling for this column, so its type and contents are unknown beyond a row count of 50 and a null rate of 0.0. The name suggests it holds prior tags associated with nucleotide records, possibly a list or nested structure that the profiler could not introspect. 
No uniqueness, distribution, or value statistics are available to characterise it further.","role":"other","scope":"column","target":"nucleotides_prev_tags","treatment":"Inspect raw values manually to determine structure before deciding on parsing or encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.cardinality","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text allergen list parsed from ingredient strings, mixing Open Food Facts taxonomy codes (en:gluten, en:milk, en:soybeans) with raw multilingual tokens (bl\u00e9, lait, NOISETTES, \u0441\u043e\u0435\u0432\u0438). 30% of the 50 rows are empty strings and the remaining 35 unique values are nearly all singletons with duplicated tokens within a single cell, so this is dirty list-encoded data rather than a clean category.","role":"feature","scope":"column","target":"allergens_from_ingredients","treatment":"Split on commas, normalize to en: taxonomy codes, dedupe tokens, then multi-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Finnish-language ingredient text with inline HTML allergen markup, mirroring the multilingual ingredient fields common in Open Food Facts. Coverage is extremely thin: null_rate is 0.9 and only 4 distinct values exist across n=50, with the empty string itself appearing twice as the top_value (top_rate 0.4 of non-nulls). 
The non-empty entries are long free-text strings wrapping allergens in <span class=\"allergen\"> tags rather than clean tokens.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_fi","treatment":"Strip HTML tags and tokenize for allergen extraction; otherwise drop, since 90% are null."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `_keywords` was skipped by the profiler, so kind is unknown and no statistics (n_unique, value distribution, length, etc.) are available. The only confirmed signals are 50 rows with a 0.0 null rate. Without further evidence the content and structure cannot be characterised \u2014 the name suggests a keyword list, but this is not verified.","role":"other","scope":"column","target":"_keywords","treatment":"Re-profile with appropriate parser (likely list/tokenized text) before deciding usage."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text manufacturing locations, mostly country names but mixed with multi-token strings combining cities, regions, and postal codes. The dominant value is the empty string (20 of 50, top_rate 0.408), making missing-or-blank the modal state, with France a distant second at 9. Across 20 unique values the entropy_ratio of 0.737 plus the long_tail alert signals scattered, inconsistent formatting (e.g. 
'France,Italie' vs full German address chains).","role":"free_text","scope":"column","target":"manufacturing_places","treatment":"Normalise blanks to null and parse/standardise to country tokens before using as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a food sub-category label (PNNS group 2), with 11 distinct values across 50 rows and no nulls. The distribution is heavily concentrated in sweets: 'Biscuits and cakes' (17) and 'Chocolate products' (16) account for 33 of 50 rows, giving a top_rate of 0.34 and entropy_ratio of 0.75. Two rows carry the literal value 'unknown', which should be treated as missing rather than a real category.","role":"label","scope":"column","target":"pnns_groups_2","treatment":"One-hot or target-encode after recoding 'unknown' to null."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Polish-language ingredient text for food products, almost entirely absent in this sample: 90% of rows are null and of the 5 non-null rows, 3 are empty strings, leaving only 2 genuine ingredient lists (both for cocoa-based chocolate). With n_unique=3 across 50 rows, this column carries virtually no usable signal here.","role":"free_text","scope":"column","target":"ingredients_text_pl","treatment":"Drop unless Polish-language analysis is required; too sparse to model."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Spanish-language generic product name, sparsely populated with only 7 unique values across 50 rows and a 60% null rate. 
The non-null values skew heavily toward dark chocolate descriptions (e.g., 'Chocolate negro' appears twice, with several variants citing cacao percentages), suggesting the dataset is dominated by chocolate products. Top rate of 0.65 reflects the empty string acting as the modal 'value', so usable coverage is even thinner than the null rate alone implies.","role":"metadata","scope":"column","target":"generic_name_es","treatment":"Treat empty strings as nulls and drop or backfill from a canonical product-name field before use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column likely intended to mark country of origin in English, but it is effectively empty: of 50 rows, 14% are null and 42 of the remaining values are blank strings, leaving just one populated label (\"France\"). Cardinality is 2 with a top_rate of 0.977 and entropy_ratio of 0.16, so the field carries almost no information.","role":"metadata","scope":"column","target":"origin_en","treatment":"Drop; the column is near-constant with blanks and only one real value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Italian generic product name, evidently a localized label field on food items. 68% of rows are null and among the 16 non-null entries the most common value is the empty string (11 occurrences), leaving only 5 distinct real names like 'Cioccolato extra fondente' and 'Crackers'. 
Coverage is too sparse to be useful as-is.","role":"metadata","scope":"column","target":"generic_name_it","treatment":"Drop or defer until Italian coverage improves; not usable at 68% null."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.zero_rate","stats.median","stats.iqr","stats.max","stats.skew","stats.kurtosis","stats.outlier_rate","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Count of ingredients that may be derived from palm oil per product. Values are extremely concentrated at zero (zero_rate 0.83, median and IQR both 0), with only 3 distinct values up to a max of 2, yet 17% of non-null rows register as outliers and skew is 2.23. An 8% null rate also means some products lack this assessment entirely.","role":"feature","scope":"column","target":"ingredients_that_may_be_from_palm_oil_n","treatment":"Binarise to zero/non-zero or drop, since the column is near-constant with heavy skew."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Spanish-language ingredient lists for food products, stored as free text. Of 50 rows, 60% are null and another 8 entries (top_rate 0.4) are empty strings, leaving only a handful of distinct populated values\u2014mostly chocolate and cereal formulations with allergen markers like _TRIGO_ and _HUEVO_. 
The 13-value cardinality and high entropy ratio (0.84) reflect that nearly every non-empty entry is unique long-form prose, not a true category.","role":"free_text","scope":"column","target":"ingredients_text_es","treatment":"Treat as multilingual free text: tokenize/embed or parse into ingredient lists; do not use as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds team affiliations as comma-separated lists of slugs, with 39 unique combinations across 50 rows and an 8% null rate. Cardinality is extreme (entropy ratio 0.97) and the most common value 'pain-au-chocolat' covers only 10.9%, while several rows pack 4-14 teams into one string. The mix of single-team and multi-team entries means this is effectively a multi-label field stored as a delimited string.","role":"feature","scope":"column","target":"teams","treatment":"split on commas and one-hot encode as multi-label team membership before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labeled food_groups_tags, suggesting it holds categorical food group classifiers (likely list-valued or comma-delimited tags). Saturn skipped profiling, so no uniqueness, cardinality, or distribution stats are available beyond a 50-row sample with zero nulls. 
Treat any inferences cautiously until the column is re-profiled with a parser that handles its native type.","role":"feature","scope":"column","target":"food_groups_tags","treatment":"Re-profile after parsing as a list/multi-label field, then one-hot or multi-hot encode the tags."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named data_quality_warnings_tags, suggesting it carries flags or tag arrays describing data quality issues per row. Saturn skipped profiling, so no uniqueness, value distribution, or stats are available beyond a 50-row sample with 0% nulls. Without parsed contents it is impossible to tell whether the field is empty strings, lists, or structured tags.","role":"metadata","scope":"column","target":"data_quality_warnings_tags","treatment":"Inspect raw values manually and parse tag structure before deciding on use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'debug_tags' was skipped by the profiler and classified as kind 'unknown', so no descriptive statistics are available beyond a row count of 50 and a null rate of 0.0. Uniqueness, distribution, and content type are all unreported, meaning we cannot infer what the field carries. The name suggests internal debugging annotations rather than analytical signal.","role":"metadata","scope":"column","target":"debug_tags","treatment":"Drop unless a downstream consumer specifically needs the debug annotations."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column `main_countries_tags` was skipped during profiling, so no type, cardinality, or value statistics are available beyond a row count of 50 and a null rate of 0.0. 
The name suggests a tags-style field listing principal countries, likely delimited or list-valued, which is probably why the profiler bailed. Nothing else can be inferred without re-profiling with list/text handling enabled.","role":"feature","scope":"column","target":"main_countries_tags","treatment":"Re-profile as a multi-valued tag field, then split/explode and one-hot encode before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Profiling was skipped for this column, so saturn emitted no type, uniqueness, or value statistics beyond a row count of 50 and a null rate of 0.0. The name suggests a nested or path-like representation of origin categories (e.g. a taxonomy hierarchy), but without parsed values this is inference from the label only. Treat it as opaque until reprofiled.","role":"other","scope":"column","target":"origins_hierarchy","treatment":"Reprofile after parsing the hierarchy (split path or explode levels) before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","min","max","mean","zero_rate","null_rate","kurtosis"],"model":"anthropic:claude-opus-4-7","narrative":"This is a binary 0/1 flag (n_unique=2, min=0, max=1) indicating whether packaging information is complete. The split is nearly even with a mean of 0.52 and zero_rate of 0.48, and 4% of rows are null. The strongly negative kurtosis (-1.99) is expected for a balanced binary variable.","role":"feature","scope":"column","target":"packagings_complete","treatment":"Cast to boolean and impute the 4% nulls before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labeled nutriscore_tags, suggesting it holds Nutri-Score classification tags (likely letter grades a-e or arrays thereof) for food products. 
Profiling was skipped, so no cardinality, value distribution, or type stats are available beyond a 50-row sample with zero nulls. Without n_unique or value frequencies, the actual contents and structure remain unverified.","role":"label","scope":"column","target":"nutriscore_tags","treatment":"Re-profile with parsing enabled, then one-hot or ordinal-encode the Nutri-Score grade for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Dutch-language ingredient lists with inline HTML `<span class=\"allergen\">` markup, evidently the NL localisation of an Open Food Facts-style ingredients field. Coverage is poor: 78% null and only 9 distinct values across 50 rows, with the most common non-null entries being short cocoa/chocolate ingredient strings while one row is clearly mis-parsed packaging footer text (Mondelez addresses, URLs). Entropy ratio 0.95 confirms the few present values are nearly all unique, so this is free text rather than a category.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_nl","treatment":"Strip HTML allergen tags, then tokenize for NLP/allergen extraction; expect heavy missingness so do not use as a primary feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.skew","stats.kurtosis"],"model":"anthropic:claude-opus-4-7","narrative":"Values are 10-digit integers ranging from 1,337,517,352 to 1,724,094,916 with all 50 rows unique and no nulls \u2014 consistent with Unix epoch seconds spanning roughly mid-2012 to mid-2024. The distribution is mildly right-skewed (skew 0.33) and platykurtic (kurtosis -0.81), with a median of 1,475,927,880.5 sitting near the mean, suggesting events are spread fairly evenly across the window rather than clustered. 
The name 'created_t' reinforces a creation-timestamp interpretation.","role":"timestamp","scope":"column","target":"created_t","treatment":"convert from Unix seconds to datetime and derive features (year, recency) before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'traces_hierarchy' was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. Without kind inference or sample stats, the content remains unknown \u2014 the name hints at nested trace/hierarchy data (likely a complex or non-scalar structure), which is consistent with the profiler skipping it.","role":"other","scope":"column","target":"traces_hierarchy","treatment":"Inspect raw values manually and parse the nested structure before it can be profiled or modelled."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Norwegian Bokm\u00e5l generic name field, likely meant to hold localized drug or product names. It is effectively empty: 96% of the 50 rows are null and the only non-null value observed is the empty string (2 occurrences), giving cardinality 1 and zero entropy.","role":"metadata","scope":"column","target":"generic_name_nb","treatment":"Drop; the column carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"German-language ingredient lists with embedded HTML <span class=\"allergen\"> tags marking allergens like SOJA, WEIZEN, and HASELN\u00dcSSE. 
Two-thirds of rows are null (null_rate 0.66) and among the 17 non-null values 16 are unique (entropy_ratio 0.99), with the empty string itself appearing twice as the top value. Casing and punctuation are inconsistent across entries, and one row contains lowercase OCR-style text with stray newlines.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_de","treatment":"Strip HTML tags to extract allergen labels into a multi-hot feature, then drop or embed the residual text."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Spanish-language ingredients lists with inline <span class=\"allergen\"> HTML markup highlighting allergens like trigo, soja, avellanas, and lactosa. 62% of the 50 rows are null and another 7 entries are empty strings, leaving only a handful of populated free-text recipes; among those that exist, all 13 unique values appear nearly distinct (entropy ratio 0.87).","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_es","treatment":"Strip the allergen HTML tags, then tokenize/embed or parse into a structured allergen list before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"French-language product names from what appears to be a food/grocery catalogue (chocolate bars, mineral water, biscuits). With 47 unique values across 50 rows and entropy ratio 0.996, this is essentially a free-text label rather than a categorical feature \u2014 the top value 'Henry's' only appears twice (4%). 
One null and a long-tail alert are flagged.","role":"free_text","scope":"column","target":"product_name_fr","treatment":"Treat as free-text product label; tokenize and embed (or use as a join key to a product table) rather than one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Comma-delimited list of retail chains where each product was observed (Lidl, Carrefour, Tesco, etc.), stored as a single string per row. Cardinality is high (31 unique across 50 rows, entropy_ratio 0.854) because most non-empty entries are bespoke multi-store concatenations appearing only once. The dominant value is an empty string at 29.17% top_rate plus a 4% null_rate, so roughly a third of rows carry no store information at all.","role":"feature","scope":"column","target":"stores","treatment":"Split on comma and one-hot or multi-hot encode individual store names; treat empty string as missing."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column is a unique record identifier \u2014 every one of the 50 rows has a distinct value (n_unique=50, top_rate=0.02, entropy_ratio=1.0). Values look like long numeric codes resembling EAN/GTIN barcodes (e.g., '6111242100992', '7622210578464'), with at least one shorter outlier ('20995553'). 
The long_tail alert simply reflects that each value occurs exactly once.","role":"identifier","scope":"column","target":"_id","treatment":"drop from modelling features; retain as a join key."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'nutriments' was skipped by the profiler, so no statistics, uniqueness, or value samples are available beyond a row count of 50 and a null rate of 0.0. The name suggests it likely holds nested nutritional data (e.g., a struct or JSON object per product), which is consistent with the profiler's inability to classify it as a standard kind. Without parsed contents we cannot describe its distribution or cardinality.","role":"other","scope":"column","target":"nutriments","treatment":"Parse/flatten the nested structure into typed sub-columns before profiling or modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column is named \"editors\" and was skipped by the profiler, so its kind is unknown and no descriptive statistics were computed. Across 50 rows there are zero nulls, but uniqueness, type, and value distribution are all unreported. Without further evidence, the content (likely a list or nested structure of editor entries) cannot be characterised.","role":"other","scope":"column","target":"editors","treatment":"Inspect raw values manually to determine type before deciding whether to parse, explode, or drop."},{"confidence":"medium","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"`max_imgid` holds 38 distinct integer-like strings across 50 rows with no nulls, suggesting it stores the maximum image identifier per record. 
Distribution is nearly uniform (entropy_ratio 0.98) with the top value '47' appearing only 3 times (top_rate 0.06), so it behaves like a high-cardinality numeric id mis-typed as categorical. The long_tail alert confirms most values occur once or twice.","role":"identifier","scope":"column","target":"max_imgid","treatment":"Cast to integer and treat as a numeric id; do not one-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is the Nutri-Score grade, a categorical food-health rating with the expected letter levels a-e plus an 'unknown' bucket, giving 6 distinct values across 50 rows with no nulls. The distribution is heavily weighted toward the worst grade: 'e' alone accounts for 54% (27/50), while healthier grades 'a' and 'b' together cover only 6 rows. Entropy ratio of 0.74 confirms the imbalance, and the lone 'unknown' row signals a missing-data sentinel mixed in with the real grades.","role":"label","scope":"column","target":"nutriscore_grade","treatment":"Treat as ordered categorical (a<b<c<d<e) and recode 'unknown' as missing before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Unit of measure for product quantities, taking only 'g' or 'ml'. The distribution is severely imbalanced: 'g' covers 44 of 45 non-null rows (top_rate 0.978) while 'ml' appears just once, and 10% of values are null. 
Entropy ratio of 0.154 confirms the column carries almost no information as-is.","role":"metadata","scope":"column","target":"product_quantity_unit","treatment":"Likely drop or collapse to a binary indicator; near-constant with one rare 'ml' case."},{"confidence":"low","critiques":[],"evidence_keys":["column","kind","n","null_rate","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labelled ingredients_analysis_tags, suggesting it carries categorical or list-valued tags from an ingredient analysis pipeline. Saturn skipped profiling, so no uniqueness, frequency, or value statistics are available beyond a 50-row sample with zero nulls. Without further stats, neither cardinality nor structure (scalar vs. list) can be confirmed.","role":"metadata","scope":"column","target":"ingredients_analysis_tags","treatment":"Re-profile with list/tag-aware parsing before deciding to one-hot encode or drop."},{"confidence":"high","critiques":[],"evidence_keys":["kind","n","n_unique","null_rate","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"French-language ingredient lists with embedded HTML <span class=\"allergen\"> markup highlighting allergens. Near-unique across 47 of 50 rows (entropy ratio 0.998), with 4% nulls and 2 empty strings as the modal value. Content varies wildly in length and formatting, mixing prose, percentages, and tagged allergen tokens.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_fr","treatment":"Strip HTML tags, parse allergen spans into a structured list, then tokenize the remaining text for NLP."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical column capturing an interface version stamp, with only 2 distinct values across 50 rows and no nulls. 
The distribution is heavily skewed: '20150316.jqm2' covers 84% (42 rows) while '20190830' accounts for the remaining 8 rows. The mixed format (one value carries a '.jqm2' suffix, the other is a bare date) suggests a schema or convention change between releases.","role":"metadata","scope":"column","target":"interface_version_modified","treatment":"Treat as a binary version flag; one-hot encode or collapse to pre/post-change indicator."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'data_sources_tags' was skipped by the profiler, so its kind, uniqueness, and value distribution are all unknown. The only confirmed signals are 50 rows with no nulls. Without parsed stats, the name suggests a multi-valued tag field (e.g., a list or delimited string of source labels), but this cannot be verified from the evidence.","role":"other","scope":"column","target":"data_sources_tags","treatment":"Manually inspect a sample to confirm structure, then explode tags into a multi-hot encoding before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_value","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds English ingredient lists with embedded HTML <span class=\"allergen\"> markup highlighting allergens like wheat, milk, soy, and nuts. With 36 unique values across 50 rows (entropy ratio 0.95) and a 16% null rate, it's near-unique free text; the top 'value' is actually the empty string (7 occurrences), and one row is junk ('Hhhhh'). 
The HTML tags and inconsistent casing/punctuation mean it needs cleaning before any allergen extraction.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_en","treatment":"Strip HTML, normalize case, and parse allergen spans into a structured multi-label feature before modelling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column `removed_countries_tags` was skipped by the profiler, so no type, uniqueness, or distribution stats are available. The only facts on hand are 50 rows with a 0.0 null rate. The name suggests a list of country tags that were removed (likely a multi-valued tag field from an Open Food Facts-style schema), but this cannot be confirmed from the evidence.","role":"other","scope":"column","target":"removed_countries_tags","treatment":"Re-profile with list/string parsing enabled before deciding whether to keep, explode, or drop."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds prior tag values associated with amino acid annotations, likely a list-like or structured field that the dissector could not parse. Nothing else can be inferred without re-profiling.","role":"other","scope":"column","target":"amino_acids_prev_tags","treatment":"Re-profile with a parser that handles its container type before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds 50 unique numeric strings of varying length (8 to 13 digits), almost certainly product barcodes (EAN/UPC/GTIN). 
Every one of 50 rows is unique with no nulls, giving maximum entropy (entropy_ratio 1.0) and a top_rate of just 0.02 \u2014 it functions as a row identifier rather than a feature. The long_tail alert simply reflects that uniqueness.","role":"identifier","scope":"column","target":"code","treatment":"Use as a join key; drop from any model as it carries no predictive signal."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'correctors' was skipped by the profiler, so its kind, uniqueness, and value distribution are unknown. Only the row count (50) and a null rate of 0.0 are reported; no other statistics are available to characterize content.","role":"other","scope":"column","target":"correctors","treatment":"Re-profile or inspect manually before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a Japanese generic-name field (generic_name_ja), but it carries essentially no information in this sample: 98% of 50 rows are null and the single non-null value is an empty string, giving cardinality 1 and entropy 0.","role":"metadata","scope":"column","target":"generic_name_ja","treatment":"Drop from modelling; retain only if needed for display lookups."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"French-language generic product names, almost certainly from an Open Food Facts-style food catalogue. Cardinality is high (34 unique across 50 rows, entropy ratio 0.87) and most values are one-off descriptors like 'Chocolat noir extra-fin traditionnel \u00e0 90% de cacao'. 
The dominant 'value' is actually the empty string at 29.8% of non-null rows, on top of a 6% null rate, so effectively over a third of records carry no usable label.","role":"free_text","scope":"column","target":"generic_name_fr","treatment":"Treat empty strings as missing, then tokenize/embed for any modelling rather than one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Polish-language generic product name field, populated for only 5 of 50 rows (90% null) and containing just 2 distinct values where 4 of the 5 non-nulls are empty strings. Effectively a single real value ('Wy\u015bmienita czkolada gorzka 70% kakao'), making the column unusable as a feature.","role":"metadata","scope":"column","target":"generic_name_pl","treatment":"Drop; null rate 0.9 and only one meaningful value."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is labelled amino_acids_tags, suggesting it would hold tags describing amino acid composition (likely a list-valued food annotation field). Saturn skipped profiling, so no uniqueness, cardinality, or value statistics are available beyond an n of 50 and a 0.0 null rate. Nothing further can be inferred without re-profiling.","role":"other","scope":"column","target":"amino_acids_tags","treatment":"Re-profile after parsing as a list/tag field before deciding on encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'ingredients_debug' was skipped by the profiler, so no type, uniqueness, or distribution stats are available. Only the row count (50) and null rate (0.0) are known; everything else is missing. 
The name suggests it is a debug/auxiliary field rather than a modelling input.","role":"metadata","scope":"column","target":"ingredients_debug","treatment":"Drop from modelling; retain only if needed for debugging upstream pipelines."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Japanese-language ingredient text with allergen markup, almost entirely absent from this sample. 98% of the 50 rows are null, and the only non-null value observed is an empty string, giving a cardinality of 1 and entropy of 0. There is no usable signal here.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_ja","treatment":"Drop; the column carries no information in this sample."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This column, data_quality_info_tags, was skipped by the profiler so its type and contents remain uncharacterised. The only signals available are 50 rows with no nulls; uniqueness, value distribution, and data kind are all unknown.","role":"other","scope":"column","target":"data_quality_info_tags","treatment":"Inspect raw values manually to determine type before deciding on handling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no type, uniqueness, or distribution stats are available beyond a row count of 50 with no nulls. The name suggests it holds last-edit dates paired with tags, likely a composite or nested field that the dissector could not parse. 
Without further evidence, its structure and content cannot be characterised.","role":"other","scope":"column","target":"last_edit_dates_tags","treatment":"Inspect raw values and parse into separate date and tag fields before use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column records the user or app that last modified each record, dominated by the bot/account 'foodless' which accounts for 21 of 49 non-null entries (top_rate 0.43). With 24 unique values across 50 rows and entropy_ratio 0.77, there's a long tail of mostly singleton contributors alongside a handful of app-like editors (municorn-calorie-counter-app, macrofactor). Null rate is low at 0.02.","role":"metadata","scope":"column","target":"last_modified_by","treatment":"Keep as audit metadata; if used as a feature, collapse the long tail into 'other' and flag bot-vs-human editors."},{"confidence":"high","critiques":[],"evidence_keys":["n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A flag column indicating products lacking nutrition data, but it carries no information here: the only observed value is the empty string, present in all 48 non-null rows (top_rate 1.0, cardinality 1, entropy 0.0). 4% of rows are null, so there is literally nothing to distinguish records.","role":"feature","scope":"column","target":"no_nutrition_data","treatment":"Drop; constant column with zero entropy."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column is named \"nutriscore\" but saturn skipped profiling it (kind=\"unknown\"), so no type, uniqueness, or distribution stats are available. 
All 50 rows are non-null, but nothing else can be confirmed from the evidence.","role":"other","scope":"column","target":"nutriscore","treatment":"Manually inspect and cast to a known type before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'origin_nb' is effectively empty: 96% of the 50 rows are null and the only non-null value observed is the empty string, which appears twice. Cardinality is 1 with zero entropy, so the field carries no information in this sample.","role":"metadata","scope":"column","target":"origin_nb","treatment":"Drop; the column is 96% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text origin/provenance strings for ingredients or products, with 20 unique values across 50 rows and a 4% null rate. The dominant value is the empty string at 24 of the 48 non-null rows (top_rate 0.5), so half of the populated values are effectively blank rather than missing. The remainder is messy: language mix (France vs Maroc vs Morocco), comma-delimited multi-origin lists, and 'en:'-prefixed taxonomy tags like 'en:Madagarcar vanilla' (note the typo) \u2014 clearly not a clean categorical.","role":"free_text","scope":"column","target":"origins","treatment":"Treat empty strings as null, normalise synonyms (Maroc/Morocco), and split on comma into a multi-label set before any encoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named nova_groups_tags, suggesting it carries NOVA food-classification group tags (a 1-4 processing-level scheme used in nutrition datasets). 
However, saturn skipped profiling it, so no type, cardinality, or value statistics are available beyond a 50-row sample with zero nulls. Without inferred kind or unique counts, the actual content and format remain unverified.","role":"metadata","scope":"column","target":"nova_groups_tags","treatment":"Manually inspect raw values to confirm format, then one-hot encode the small set of NOVA group tags."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column is named 'languages' but saturn skipped profiling, so type and distribution are unknown. With 50 rows and no nulls, every record carries some value, yet n_unique and other stats are unavailable. The name suggests a list-like field (e.g., languages spoken or supported), which would explain why the dissector flagged it as unknown.","role":"other","scope":"column","target":"languages","treatment":"Inspect raw values and parse (likely explode list-typed entries) before further profiling."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is flagged as skipped by the profiler, so no descriptive statistics, uniqueness, or value samples are available beyond a row count of 50 and a 0.0 null rate. The name suggests it holds Nutri-Score 2023 classification tags (likely a categorical label such as a, b, c, d, e), but that interpretation cannot be verified from the evidence provided. 
No distributional or quality signals can be assessed here.","role":"other","scope":"column","target":"nutriscore_2023_tags","treatment":"Re-run profiling with this column included to determine its type and cardinality before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a tags field listing packaging materials, likely a delimited or list-valued string per row. Saturn skipped profiling, so no uniqueness, cardinality, or value-frequency stats are available beyond a 50-row sample with zero nulls. Without parsed token statistics, the actual material vocabulary and its distribution remain unknown.","role":"free_text","scope":"column","target":"packaging_materials_tags","treatment":"Split on the tag delimiter and one-hot or multi-hot encode the resulting material tokens before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is a language code column with 5 distinct values and no nulls across 50 rows. The distribution is heavily dominated by 'fr' at 70% (35/50), with 'en' a distant second at 10 occurrences and 'de', 'bg', 'ro' appearing only 1-3 times each. 
Entropy ratio of 0.56 confirms the imbalance, and the long tail of rare languages (bg, ro with single observations) may be unstable for any per-language modelling.","role":"feature","scope":"column","target":"lang","treatment":"One-hot encode with rare languages (bg, ro, de) collapsed into an 'other' bucket."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Swedish packaging text field that is effectively empty: 92% of the 50 rows are null and the remaining 4 non-null values are all the empty string, giving a single observed category with entropy 0. There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_sv","treatment":"Drop; column is 92% null and the only non-null value is an empty string."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column 'photographers' was skipped by the profiler, so no type, uniqueness, or value statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds photographer attributions, possibly as a list or nested structure that the dissector could not parse. Without unique counts or sample values, nothing further can be inferred.","role":"other","scope":"column","target":"photographers","treatment":"Inspect raw values manually to determine structure before deciding whether to parse, explode, or drop."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is named languages_codes but saturn skipped detailed profiling, leaving kind as unknown with no uniqueness or value statistics. The only confirmed signals are 50 rows and a 0.0 null rate. 
Without sample values or cardinality, the structure (single code, list, or delimited string) cannot be determined from the evidence.","role":"other","scope":"column","target":"languages_codes","treatment":"Re-profile with parsing enabled to determine whether values are scalar codes or lists before use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is the Eco-Score grade, a categorical environmental rating with letter tiers from a-plus through f plus sentinel values 'unknown' and 'not-applicable'. Distribution skews toward worse grades: 'e' leads at 12/50 (top_rate 0.24), followed by 'd' (9), while 'a' and 'a-plus' together account for only 5 rows. Six rows are 'unknown' and one 'not-applicable', so roughly 14% of values are non-informative sentinels that need handling.","role":"label","scope":"column","target":"ecoscore_grade","treatment":"Map sentinels ('unknown','not-applicable') to NA and treat the remaining tiers as an ordinal factor."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.median","stats.std","stats.q1","stats.q3","stats.iqr","stats.skew","stats.kurtosis","stats.n_outliers","stats.outlier_rate","stats.zero_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric count of ingredients per record, ranging from 1 to 39 with a median of 9 and mean of 11.7. The distribution is right-skewed (skew 1.24, kurtosis 1.44) with a wide IQR of 11 and 2 outliers (4%) on the high end. 
No nulls or zeros, and 22 unique values across 50 rows suggest a discrete count variable.","role":"feature","scope":"column","target":"ingredients_n","treatment":"Consider log or sqrt transform before modelling to tame the right skew."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical allergen tags using an Open Food Facts-style 'en:' prefix, often combined as comma-separated lists (e.g., 'en:gluten,en:milk,en:soybeans'). The most common value is an empty string at 32% (16/50), suggesting missing or no-allergen records encoded as blanks rather than nulls. With 16 unique values across 50 rows and entropy ratio 0.84, the distribution is fairly spread; gluten, milk, and soybeans dominate the non-empty tags.","role":"feature","scope":"column","target":"allergens","treatment":"Split on comma and multi-hot encode allergen tags; treat empty string as missing."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no statistics are available beyond a row count of 50 and a 0.0 null rate. The name suggests it holds tag-style annotations for minerals (likely a list or delimited string per row), but uniqueness, cardinality, and value distribution are all unknown here.","role":"other","scope":"column","target":"minerals_tags","treatment":"Re-profile with a parser appropriate for list/tag fields before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text product name field with 49 unique values across 50 rows, near-maximal entropy ratio of 0.998 \u2014 effectively a per-row label. 
Values mix languages (French, English, Cyrillic) and formats (brand-only like 'Henry's' versus full descriptors like 'CRISTALINE Eau De Source 0.5L'), and one row is an empty string despite a reported null_rate of 0.0. The single repeat ('Henry's', 2) is the only signal preventing full uniqueness.","role":"free_text","scope":"column","target":"product_name","treatment":"Normalize casing and empty strings, then tokenize/embed rather than one-hot encode."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-form purchase location strings, often listing multiple places per row separated by commas. France dominates at 9 of the 49 non-null rows (18.4%), followed by an empty string (6) and Maroc (5), but with 32 unique values across 50 rows and entropy ratio 0.90, the long tail includes multi-country concatenations like 'Madrid,Espa\u00f1a,Montargis,France,W\u00fcrzburg,Deutschland,...'. Mixed languages (Maroc vs Morocco, Espa\u00f1a vs Spain) and embedded postal codes signal inconsistent data entry rather than a clean categorical.","role":"free_text","scope":"column","target":"purchase_places","treatment":"Split on commas and normalize each token to a canonical country before using as a multi-label feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column records product quantities as free-text strings, dominated by gram weights but with no consistent format \u2014 '100 g', '100g', and '100 gram' all appear separately among the top values. With 36 unique values across 50 rows and entropy ratio 0.959, the field is highly fragmented; the most common value '100 g' covers only 12.2% of non-nulls, and 2% are null plus 2 empty strings. 
The long_tail alert reflects this unit/spacing inconsistency rather than genuine variety.","role":"feature","scope":"column","target":"quantity","treatment":"Normalize units and parse into a numeric grams column before use."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column `traces_tags` was skipped by the profiler, so no type, uniqueness, or distribution statistics are available. The only confirmed signals are 50 rows present and a null rate of 0.0, meaning every row has some value but its content and structure are unknown. The name suggests it may hold tag annotations associated with traces, possibly a nested or list-typed field that the profiler could not parse.","role":"other","scope":"column","target":"traces_tags","treatment":"Inspect raw values manually to determine structure before deciding whether to parse, explode, or drop."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the Ukrainian-language ('uk') variant of the origin text field rather than a UK-origin flag, but it carries virtually no signal: 98% of the 50 rows are null and the only non-null value observed is an empty string. With cardinality of 1 and entropy of 0, the column has no discriminative power as it stands.","role":"feature","scope":"column","target":"origin_uk","treatment":"Drop; column is 98% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Arabic generic-name field that is overwhelmingly empty: 80% of the 50 rows are null and of the 10 populated rows, 9 are blank strings and only 1 carries an actual Arabic value (\u0627\u0644\u0627\u0645\u064a\u0631). 
With cardinality of just 2 and a top_rate of 0.9 on the empty string, this column carries almost no information as currently captured.","role":"metadata","scope":"column","target":"generic_name_ar","treatment":"Drop or defer until source data is backfilled; not usable as-is."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be Ukrainian packaging text, but it is effectively empty: 98% of the 50 rows are null and the single non-null value is itself an empty string. Cardinality is 1 with zero entropy, so it carries no information.","role":"metadata","scope":"column","target":"packaging_text_uk","treatment":"Drop; the column has no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Arabic-language ingredients text, populated for only 11 of 50 rows (null_rate 0.78) and with 10 of those 11 non-null entries being empty strings. Only one row carries an actual Arabic ingredient list, giving cardinality 2 and a top_rate of 0.91 on the empty string. Effectively unusable as a feature on this sample.","role":"free_text","scope":"column","target":"ingredients_text_ar","treatment":"Drop for modelling; retain only if you specifically need Arabic ingredient parsing and can source more populated rows."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Ukrainian-language ingredients text, almost entirely absent in this sample. 98% of rows are null and the single non-null value is an empty string, leaving zero usable content. 
Entropy is 0 and cardinality is 1, so the column carries no signal here.","role":"free_text","scope":"column","target":"ingredients_text_uk","treatment":"Drop from this slice; revisit only if a Ukrainian-locale subset is loaded."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so no type, uniqueness, or distribution statistics are available beyond a row count of 50 and a null rate of 0.0. The name suggests it stores tags associated with last-check dates, possibly a list or composite field that the dissector could not parse. Without further stats, nothing can be said about its values.","role":"other","scope":"column","target":"last_check_dates_tags","treatment":"Inspect raw values manually and re-profile after parsing into a structured type."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This looks like a checkbox-style flag (likely from a web form), where the only observed value is \"on\" in 7 of 50 rows. The remaining 86% are null, and entropy is 0.0 because there is no variation among the non-null entries. With cardinality of 1, the column carries no discriminative signal as captured.","role":"feature","scope":"column","target":"checked","treatment":"Convert to a boolean (on vs null) or drop, since it has only one observed value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be Arabic-language packaging text, but it carries no information in this sample: 80% of the 50 rows are null and the remaining 10 values are all empty strings, giving cardinality 1 and entropy 0. 
There is nothing to model or join on here.","role":"free_text","scope":"column","target":"packaging_text_ar","treatment":"Drop; the column is effectively constant-empty with 80% nulls."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.min","stats.max","stats.median","stats.skew","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Numeric coverage metric indicating the share of an item's known ingredients that have a carbon footprint estimate, ranging from 8.0 to 105.0 with a median of 70.0. The 62% null rate is the dominant signal \u2014 only 19 distinct values populate this column across 50 rows, so most records lack any coverage figure at all. The max of 105.0 is mildly surprising for what reads like a percentage, and the distribution is slightly left-skewed (skew -0.45) with no flagged outliers.","role":"feature","scope":"column","target":"carbon_footprint_percent_of_known_ingredients","treatment":"Impute or add a missingness indicator before modelling, and verify whether values above 100 are valid."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This looks like the username of the last reviewer/checker on a record, with only 4 distinct values across 50 rows. The column is 86% null, so just 7 rows carry a value, and 'aleene' accounts for 3 of those (top_rate 0.43). 
Entropy ratio of 0.92 indicates the few present values are spread fairly evenly across the small handful of checkers.","role":"metadata","scope":"column","target":"last_checker","treatment":"Treat missingness as a 'never checked' category; too sparse to use as a model feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Ukrainian-language product name field that is effectively empty: 98% of the 50 rows are null and the single non-null value is itself an empty string, giving a cardinality of 1 and entropy of 0. There is no usable signal here whatsoever.","role":"metadata","scope":"column","target":"product_name_uk","treatment":"Drop the column; it carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Ukrainian-language ('uk') generic product name field, but it is effectively empty in this sample: 98% of the 50 rows are null and the only non-null value is an empty string. Cardinality is 1 with zero entropy, so the column carries no information here.","role":"metadata","scope":"column","target":"generic_name_uk","treatment":"Drop; no usable signal at this null rate and cardinality."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Arabic-language product name field that is mostly absent: 78% null and only 6 distinct values across 50 rows. 
The non-null entries are a language mix \u2014 one Arabic string (\u0628\u0631\u0646\u0633) alongside Spanish and English names like 'Leche Y Almendras' and 'Chocolate Negro 92% Cacao' \u2014 suggesting the column is not consistently populated with Arabic translations. The most frequent observed value is an empty string (6 occurrences, 54.5% of non-nulls), indicating empties coexist with true nulls.","role":"metadata","scope":"column","target":"product_name_ar","treatment":"Drop or defer until translation coverage improves; normalise empty strings to null and validate language before use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Debug trace string showing the per-ingredient carbon footprint computation (percentage \u00d7 emission factor = grams) for each product. Every one of the 14 non-null values is unique (entropy_ratio \u2248 1.0, top_rate 0.07), and 72% of rows are null, so it functions as a verbose audit log rather than a feature.","role":"metadata","scope":"column","target":"carbon_footprint_from_known_ingredients_debug","treatment":"Drop from modelling; retain only for auditing the carbon calculation."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.min","stats.max","stats.skew","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Values are Unix epoch seconds ranging from 1540933974 to 1730226344, consistent with 'last checked' timestamps spanning roughly late 2018 to late 2024. Severe sparsity dominates: null_rate is 0.86 and only 7 unique values populate the 50 rows, so this column is barely usable as-is. 
Distribution is mildly right-skewed (skew 0.81) with no outliers flagged.","role":"timestamp","scope":"column","target":"last_checked_t","treatment":"Convert from epoch seconds to datetime and treat as mostly-missing; impute or drop before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the Ukrainian-language ('uk') variant of an ingredients-with-allergens text field, but it is effectively empty in this sample. 98% of the 50 rows are null, and the single non-null value is itself an empty string, giving cardinality 1 and zero entropy. There is no usable signal here.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_uk","treatment":"Drop; no observed values in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Arabic-language ingredients text (with allergen markup) for food products. The column is 82% null across just 50 rows, and of the 9 non-null entries 8 are empty strings \u2014 only 1 row carries an actual ingredient list. Effectively no usable signal at this sample size.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_ar","treatment":"Drop for now; revisit only if a larger Arabic-localized sample becomes available."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical field 'origin_ar' carries a single observed value (an empty string) across the 10 non-null rows, while 80% of records are null. 
With cardinality 1 and entropy 0, the column conveys no information in this sample.","role":"metadata","scope":"column","target":"origin_ar","treatment":"Drop; the column is 80% null and constant on the remainder."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column `nutriments_estimated` was skipped by the profiler, so no type, uniqueness, or distribution stats are available. The only facts on record are that all 50 sampled rows are non-null and the kind is unknown. Without further evidence, the content and structure of this field cannot be characterised.","role":"other","scope":"column","target":"nutriments_estimated","treatment":"Re-profile with an appropriate parser before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.std"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a binary warning flag indicating a missing-fiber condition in a nutrition score, encoded as 1 when triggered. Every one of the 15 non-null rows holds the value 1.0, and 70% of rows are null \u2014 consistent with a sparse flag that is only populated when the warning fires. With zero variance, it carries no discriminative signal as-is.","role":"feature","scope":"column","target":"nutrition_score_warning_no_fiber","treatment":"Recode nulls to 0 to convert into a usable binary indicator, or drop if still constant after recoding."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","column","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column, named `ingredients_text_debug_tags`, was skipped by the profiler so no distributional statistics are available. The name suggests it holds debugging tags emitted by an ingredients-text parser, likely a list or sparse string field. 
With 50 rows observed and a 0.0 null rate reported but no unique count or value stats, nothing further can be inferred from the evidence.","role":"metadata","scope":"column","target":"ingredients_text_debug_tags","treatment":"Inspect raw values manually; likely drop unless debugging the ingredients parser."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'taxonomies_enhancer_tags' was skipped by the profiler, so no type, uniqueness, or distributional statistics are available beyond a row count of 50 and a null rate of 0.0. Without kind detection or value samples, its content (likely some form of taxonomy/tag payload based on the name) cannot be verified from the evidence.","role":"other","scope":"column","target":"taxonomies_enhancer_tags","treatment":"Re-profile with parsing enabled (likely a nested/list field) before deciding on use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.min","stats.max","stats.median","stats.skew","n_unique","stats.n_outliers"],"model":"anthropic:claude-opus-4-7","narrative":"Values are 10-digit integers ranging from 1628199203 to 1763195431, consistent with Unix epoch seconds spanning roughly 2021 through 2025 \u2014 almost certainly a 'completed at' timestamp. The 68% null rate is the dominant signal, suggesting most records were never completed. 
Distribution across the non-null 16 unique values is near-symmetric (skew ~0.001) with no outliers.","role":"timestamp","scope":"column","target":"completed_t","treatment":"Convert from epoch seconds to datetime and treat nulls as 'not yet completed' rather than imputing."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"This is a Bulgarian-language product name field, with values like '\u0428\u043e\u043a\u043e\u043b\u0430\u0434 85% \u043a\u0430\u043a\u0430\u043e\u0432\u0430 \u043c\u0430\u0441\u0430' indicating localized chocolate/cocoa product labels. It is 94% null across 50 rows, leaving only 3 non-null entries that are all unique. With so little populated data, this column carries almost no analytical signal in its current state.","role":"metadata","scope":"column","target":"product_name_bg","treatment":"Drop or defer until Bulgarian localization coverage improves; too sparse to use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text ingredient lists ostensibly tagged as Estonian (et), but the three observed values mix Slovenian, German, and Estonian, suggesting mislabeled locale tagging. The field is 94% null with only 3 non-null entries out of 50, so any signal here is anecdotal at best.","role":"free_text","scope":"column","target":"ingredients_text_et","treatment":"Drop or defer; too sparse and language-inconsistent to model without a language-detection cleanup pass."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column appears to be an origin identifier or location code, but it is effectively empty in this sample. 
98% of the 50 rows are null, and the single non-null value is itself a blank string, leaving cardinality at 1 and entropy at 0.","role":"metadata","scope":"column","target":"origin_sl","treatment":"Drop; the column carries no usable signal at this null rate."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a localized (Algerian/Dzongkha?) generic-name field, but it is effectively empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string. Cardinality is 1 with zero entropy, so the column carries no information.","role":"metadata","scope":"column","target":"generic_name_dz","treatment":"Drop; no signal (98% null, single empty-string value)."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Slovenian-language ingredients text, almost entirely empty: 98% null with only 1 non-null value across 50 rows. The single observed entry is a free-form product label (cocoa-based confection) rather than a controlled vocabulary, so the categorical framing is misleading.","role":"free_text","scope":"column","target":"ingredients_text_sl","treatment":"Drop for modelling; if needed, treat as free text and merge with other-language ingredient fields."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Catalan-language generic product name field, but it is effectively empty: 96% of rows are null and the only non-null value observed is the empty string (2 occurrences). 
Cardinality is 1 with zero entropy, so the column carries no information in this sample.","role":"metadata","scope":"column","target":"generic_name_ca","treatment":"Drop; the column is 96% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","top_value","top_rate","cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Dzongkha-language ingredients text field, likely a localized variant of a multilingual product description column. Out of 50 rows, 98% are null and the single non-null value is an empty string, leaving zero usable content.","role":"free_text","scope":"column","target":"ingredients_text_dz","treatment":"Drop; effectively empty in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Catalan-language product name field, but it is effectively empty: 96% of the 50 rows are null and the only 2 non-null values are blank strings, giving a single observed category with entropy 0. There is no usable signal here.","role":"metadata","scope":"column","target":"product_name_ca","treatment":"Drop the column; it is 96% null with no distinct values."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Canadian-origin flag or code field, but it's effectively empty: 96% of the 50 rows are null, and the only 2 non-null values are both blank strings. 
With cardinality of 1 and entropy of 0, the column carries no information.","role":"feature","scope":"column","target":"origin_ca","treatment":"Drop; the column is 96% null and the remaining values are empty strings."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.entropy_ratio","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Estonian-localized product name field, but 94% of the 50 rows are null and only 3 distinct values appear among the remainder \u2014 including one empty string and two names that are actually French and English, not Estonian. With each surviving value occurring exactly once (entropy_ratio 1.0), this column carries almost no usable signal and shows a language-tagging mismatch.","role":"metadata","scope":"column","target":"product_name_et","treatment":"Drop from modelling; revisit upstream localization pipeline since values aren't in Estonian."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.cardinality","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Bulgarian-language ingredient lists with inline HTML allergen markup (<span class=\"allergen\">), localised for the bg market. Coverage is extremely thin: 94% null and only 3 distinct values across 50 rows, one of which is an empty string. 
The two real entries are confectionery ingredient declarations mentioning soy, hazelnuts and milk allergens.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_bg","treatment":"Strip the HTML tags and treat as free text; too sparse (94% null) to use as a feature without aggregation across locales."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","cardinality","top_values","top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Estonian-localised ingredient text with allergen markup, but only 3 of 50 rows carry a value (null_rate 0.94) and all three are unique \u2014 and not even in Estonian (one Slovenian, one German, plus one short Estonian entry). The field is essentially empty and the few populated rows show a language mix rather than the expected `et` locale, suggesting upstream localisation fallback or mislabelling.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_et","treatment":"Drop unless you specifically need allergen extraction; 94% nulls and inconsistent language make it unusable as-is."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"`origin_sk` appears to be a surrogate key for an origin entity, but it carries almost no information in this slice: 98% of the 50 rows are null and the single non-null value is an empty string. 
Cardinality is 1 and entropy is 0, so the column is effectively constant where populated.","role":"foreign_key","scope":"column","target":"origin_sk","treatment":"Drop from modelling; investigate upstream join before relying on it."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an origin block-group identifier, likely a geographic foreign key. It is effectively unusable here: 94% of rows are null, and the only 1 distinct value observed across the 50 rows is the empty string (3 occurrences), giving entropy 0.0.","role":"foreign_key","scope":"column","target":"origin_bg","treatment":"Drop; no usable signal at this null rate and cardinality."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Slovenian-language packaging text field, but it is effectively empty: 98% of the 50 rows are null and the single non-null value is an empty string, giving cardinality 1 and entropy 0. There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_sl","treatment":"Drop; the column is 98% null with only an empty-string value otherwise."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a surrogate key linking to a generic drug name dimension, but it is effectively empty in this sample. 
98% of rows are null and the single non-null value is the empty string, giving cardinality 1 and zero entropy.","role":"foreign_key","scope":"column","target":"generic_name_sk","treatment":"Drop or defer until a non-empty sample is available; carries no signal here."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Slovenian-language ingredients list with embedded allergen HTML markup (`<span class=\"allergen\">`), likely a localized product label field. The column is almost entirely empty with a null_rate of 0.98, leaving only 1 non-null row out of 50, and that single value is the only unique entry (cardinality 1, entropy 0.0). With essentially no signal and HTML mixed into the text, it carries no analytical value as-is.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_sl","treatment":"Drop; 98% null and only one observed value make it unusable, or strip HTML and reserve for text extraction if more rows arrive."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Catalan-language ingredients text field, almost entirely absent from this sample. 96% of the 50 rows are null and the only 2 non-null values are empty strings, giving a single distinct value and zero entropy.","role":"free_text","scope":"column","target":"ingredients_text_ca","treatment":"Drop; the column carries no usable signal in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a Slovenian-language generic name field that is effectively empty in this sample. 
With a 98% null rate and the only non-null value being an empty string, there is zero usable signal (entropy 0.0, cardinality 1).","role":"metadata","scope":"column","target":"generic_name_sl","treatment":"Drop; no usable values present."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a localized product name field (Dzongkha or similar locale suffix), but it is effectively empty: 98% of the 50 rows are null and the single non-null value is itself an empty string. Cardinality is 1 with zero entropy, so the column carries no usable signal in this sample.","role":"metadata","scope":"column","target":"product_name_dz","treatment":"Drop; the column is 98% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"`origin_et` appears to be a categorical metadata field, but it carries almost no information here: 94% of the 50 rows are null and the only non-null value observed is the empty string, which accounts for all 3 populated rows. Cardinality is 1 and entropy is 0, so the column is effectively constant where present.","role":"metadata","scope":"column","target":"origin_et","treatment":"Drop; constant empty value with 94% nulls offers no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Column appears to be a surrogate key for ingredient text with allergen markup, but it is effectively empty: 98% of 50 rows are null and the only observed value is the empty string. 
Cardinality is 1 with zero entropy, so there is no usable signal here.","role":"identifier","scope":"column","target":"ingredients_text_with_allergens_sk","treatment":"Drop; the column is 98% null with a single empty value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Almost certainly a Slovak product name field that is effectively empty in this slice \u2014 98% of the 50 rows are null and the single non-null value is itself an empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here whatsoever.","role":"free_text","scope":"column","target":"product_name_sk","treatment":"Drop; the column is 98% null with only an empty string observed."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Portuguese-language ingredient lists with embedded HTML allergen tags (<span class=\"allergen\">\u2026</span>), likely scraped from a food product database. The column is sparsely populated with an 0.84 null rate, and among the 8 non-null rows 5 are empty strings, leaving only 3 genuine ingredient declarations. 
Each non-empty value is unique and contains raw HTML markup rather than cleaned text.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_pt","treatment":"Strip HTML tags to extract allergen tokens, then treat as sparse free text; too null-heavy for direct modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Localized ingredients text with allergens for Catalan, but it's effectively empty in this sample: 98% null and the only non-null value observed is itself an empty string. With cardinality of 1 and entropy 0, this column carries no information here.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_ca","treatment":"Drop; no usable signal in this slice."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Portuguese-language generic product name, present for only 20% of the 50 rows (null_rate 0.8) and otherwise dominated by an empty string (top_rate 0.8 on value ''). Among the 10 non-null entries only 2 distinct strings appear in the top values, both descriptive food labels like 'Chocolate extrafino com 70% de cacau'. Coverage is too thin and cardinality too low (n_unique 3 including the blank) to support modelling on its own.","role":"free_text","scope":"column","target":"generic_name_pt","treatment":"Drop or retain only as a fallback display label; coverage is too sparse to feature-engineer."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Portuguese packaging-text field, likely free-form descriptions of product packaging. 
It is effectively empty: 80% of the 50 rows are null, and the remaining 10 rows all hold the empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_pt","treatment":"Drop the column; it carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"Portuguese-language ingredient lists for food products, stored as free text. The column is mostly empty: 80% null and the most common value (7 of 50 rows) is an empty string, leaving only 4 distinct values across 50 rows. The few populated entries are long, comma-separated ingredient declarations with allergen tokens in caps or underscores.","role":"free_text","scope":"column","target":"ingredients_text_pt","treatment":"Treat as free text: drop or impute the empty majority, then tokenize and parse ingredients before modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an origin point identifier, but it carries no usable signal in this sample. 80% of rows are null and the remaining 10 rows all hold the same empty-string value, giving a single unique category and entropy of 0.","role":"metadata","scope":"column","target":"origin_pt","treatment":"Drop; the column is 80% null and the rest is a constant empty string."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.min","stats.max","stats.mean","stats.std"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a flag indicating that the nutrition score warning was estimated from nutriment data, likely a 0/1 boolean. 
Of 50 rows, 96% are null and the remaining 4% all carry the value 1.0, making it effectively constant where present. With no variation and almost no coverage, it carries no usable signal.","role":"feature","scope":"column","target":"nutrition_score_warning_nutriments_estimated","treatment":"Drop; constant-when-present and 96% null."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely Bulgarian-language packaging text from a product database. The column is effectively empty: 94% null and the only non-null value across 50 rows is the empty string itself (3 occurrences), giving cardinality 1 and zero entropy.","role":"free_text","scope":"column","target":"packaging_text_bg","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an Estonian-language generic name field, but it carries no usable signal in this sample: 94% of rows are null and the only non-null value observed is the empty string (3 occurrences), giving cardinality 1 and entropy 0. Effectively every record is missing or blank.","role":"metadata","scope":"column","target":"generic_name_et","treatment":"Drop; column is 94% null with a single empty-string value otherwise."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a Canadian-locale packaging text field from a product catalog. 
It is effectively empty: 96% null and the only 2 non-null values are both blank strings, giving a single distinct value and zero entropy.","role":"metadata","scope":"column","target":"packaging_text_ca","treatment":"Drop; the column carries no signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Localized Slovenian product name field that is effectively empty: 98% of 50 rows are null and the single populated row reads \"ARRIBA 85% cacao\". With cardinality 1 and entropy 0, this column carries no usable signal in the current sample.","role":"metadata","scope":"column","target":"product_name_sl","treatment":"Drop from modelling; revisit only if a fuller localized catalogue becomes available."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Bulgarian-language generic drug name field, but it is effectively empty: 94% of the 50 rows are null and the only non-null value observed is the empty string itself, repeated 3 times. 
Cardinality is 1 with zero entropy, so the column carries no information.","role":"metadata","scope":"column","target":"generic_name_bg","treatment":"Drop; the column is 94% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Slovak-language ingredients text field (suffix _sk), but it is effectively empty in this sample: 98% of 50 rows are null and the single non-null value is an empty string, yielding cardinality 1 and entropy 0.","role":"free_text","scope":"column","target":"ingredients_text_sk","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.cardinality","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Bulgarian-language ingredient lists for food products, stored as free text in Cyrillic. The column is almost entirely empty (null_rate 0.94) with only 3 non-null values across 50 rows, each unique \u2014 effectively unusable as a categorical feature. Despite the categorical kind label, the content is long-form ingredient prose, not a discrete category.","role":"free_text","scope":"column","target":"ingredients_text_bg","treatment":"Drop unless doing multilingual text analysis; 94% null leaves too little signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Estonian packaging text field that is effectively empty: 94% of 50 rows are null, and the only non-null value observed is the empty string itself (3 occurrences). 
With cardinality of 1 and entropy of 0, this column carries no information.","role":"free_text","scope":"column","target":"packaging_text_et","treatment":"Drop; no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a surrogate key for packaging text, but it is essentially empty: 98% of the 50 rows are null and the single non-null value is an empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here.","role":"foreign_key","scope":"column","target":"packaging_text_sk","treatment":"Drop; 98% null and only one observed value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_rate","top_values","stats.entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"This is a Portuguese-localized product name field, but it is mostly empty: 80% null and only 7 distinct values across 50 rows, with the top value being the empty string at 40%. The non-null entries are a language mix (Portuguese, Italian, French, English) rather than purely Portuguese, suggesting fallback to original-language labels when no translation exists. Entropy ratio of 0.90 reflects that the few present values are nearly all unique.","role":"free_text","scope":"column","target":"product_name_pt","treatment":"Drop or treat as optional metadata; too sparse and language-inconsistent for direct modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a French abbreviated product name field (brand + descriptor + size), used as a display label for items. 
The column is mostly empty with a null_rate of 0.86, leaving only 7 unique values across 50 rows, each appearing once \u2014 entropy_ratio is 1.0, so among the populated rows every value is distinct. Sparsity makes it unusable as a categorical feature in its current state.","role":"label","scope":"column","target":"abbreviated_product_name_fr","treatment":"Drop or treat as free text; too sparse and unique to encode as a category."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a boolean-style flag indicating whether a record was imported as obsolete, but the signal is effectively absent: 86% of rows are null and the only observed value is \"0\" across all 7 non-null entries. Cardinality is 1 with zero entropy, so the column carries no discriminative information in this sample.","role":"feature","scope":"column","target":"obsolete_imported","treatment":"Drop; constant value with 86% nulls offers no modelling signal."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","n_unique","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `sources_fields` was skipped by the profiler, so its kind, cardinality, and value statistics are all unavailable. The only confirmed signals are 50 rows present with a null rate of 0.0, meaning every row has some value, but nothing is known about what those values look like. 
Without further inspection this column cannot be characterised.","role":"other","scope":"column","target":"sources_fields","treatment":"Re-profile or manually inspect a sample before deciding on downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_value","stats.top_rate","stats.entropy"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an embargo or embarkation code, with values like \"EMB 44068 A\" suggesting an alphanumeric reference identifier. The column is almost entirely empty: 98% null across 50 rows, leaving a single non-null observation. With only one value present, entropy is 0 and no distributional inference is possible.","role":"metadata","scope":"column","target":"emb_code","treatment":"Drop; 98% null with only one observed value provides no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a language tag for imported records, but 86% of the 50 rows are null and the remaining 7 entries are all 'fr'. With only one observed value, entropy is 0 and the column carries no discriminative signal as captured.","role":"metadata","scope":"column","target":"lang_imported","treatment":"Drop or hold aside until more non-null values arrive; constant 'fr' with 86% nulls is unusable as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Chinese generic-name field, but it is effectively empty: 98% of the 50 rows are null and the single non-null observation is itself an empty string. 
Cardinality is 1 with zero entropy, so the column carries no usable signal in this sample.","role":"metadata","scope":"column","target":"generic_name_zh","treatment":"Drop; the column is 98% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds French-language storage instructions imported from an external source (e.g., 'A conserver de pr\u00e9f\u00e9rence \u00e0 l'abri du soleil...'). Coverage is extremely sparse: 86% null and only 7 distinct phrasings across 7 non-null rows, each appearing exactly once. The values are free-text variants of the same advice rather than a controlled vocabulary, so entropy_ratio sits at 1.0.","role":"free_text","scope":"column","target":"conservation_conditions_fr_imported","treatment":"Drop or normalise via keyword extraction; too sparse and too variable to use as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language origin/import provenance field, with values ranging from a single country tag (\"France\") to a multi-line description of cocoa paste sourcing across continents. Only 2 of 50 rows are populated (null_rate 0.96), and both populated values are unique, giving entropy_ratio 1.0 over a cardinality of 2. 
The mix of a clean country label with a long descriptive string suggests inconsistent data entry rather than a true categorical.","role":"free_text","scope":"column","target":"origin_fr_imported","treatment":"Drop or defer; 96% null and entries mix country codes with prose, so not usable as a category without manual normalisation."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column listing the owning organization (food/beverage manufacturers like Barilla, Ferrero, Nestl\u00e9) for each record. The column is overwhelmingly empty: 86% null, leaving only 7 populated rows spread across 6 distinct owners, with Barilla appearing twice and the rest singletons. Entropy ratio of 0.98 confirms the non-null values are nearly uniform, so there is little signal beyond identifying who submitted the entry.","role":"metadata","scope":"column","target":"owner","treatment":"Drop or retain as provenance metadata only; too sparse for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_rate","stats.cardinality","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"French-language ingredient declarations imported from an external source, with each non-null value being a long free-text recipe listing (allergens capitalised, percentages, additive codes). The column is 86% null and the 7 present values are all unique, yielding maximum entropy (entropy_ratio 1.0) and a top_rate of just 0.14. 
This is unstructured product copy, not a category, despite being typed as categorical.","role":"free_text","scope":"column","target":"ingredients_text_fr_imported","treatment":"Treat as free text: parse ingredient lists or tokenize/embed for NLP rather than one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_rate","entropy_ratio","top_values","n"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical tag identifying the owning organization for each record, with values like 'org-barilla-france-sa' and 'org-nestle-france' suggesting Open Food Facts-style contributor org slugs. The column is 86% null, leaving only 7 populated rows spread across 6 distinct owners, so entropy ratio is near-saturated (0.976) and the top value covers just 2 records. With this much sparsity it carries almost no signal at n=50.","role":"metadata","scope":"column","target":"owners_tags","treatment":"Drop or retain only as a provenance tag; too sparse to use as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Chinese product name field that is effectively empty in this sample: 98% of the 50 rows are null, and the single non-null value is itself an empty string. 
Cardinality is 1 with zero entropy, so the column carries no usable signal here.","role":"metadata","scope":"column","target":"product_name_zh","treatment":"Drop from modelling; revisit only if a larger sample shows actual Chinese strings populated."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be metadata indicating the basis on which nutrition data was prepared, with the only observed value being '100g'. It is essentially a constant: 86% of rows are null and the remaining 7 entries all share the single value '100g', giving zero entropy.","role":"metadata","scope":"column","target":"nutrition_data_prepared_per_imported","treatment":"Drop; constant column with no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language abbreviated product name field, likely imported from an external catalog. It is overwhelmingly empty with a null_rate of 0.86, leaving only 7 distinct values across 50 rows, each appearing once (top_rate 0.143, entropy_ratio 1.0). The few populated entries mix brand-led formats like \"CRISTALINE Eau De Source 0.5L\" and \"NESTLE DESSERT Noir 205g\" with locale tags such as \"Authentique 275g, fr\".","role":"metadata","scope":"column","target":"abbreviated_product_name_fr_imported","treatment":"Drop or defer; too sparse (86% null) and unique to model directly."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a debug-tag field associated with Chinese generic names, but saturn skipped profiling so no value-level statistics are available. 
The only confirmed signals are 50 rows with a 0.0 null rate; uniqueness, distribution, and content are unknown.","role":"metadata","scope":"column","target":"generic_name_zh_debug_tags","treatment":"Re-profile or inspect manually before use; likely drop as debug instrumentation."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds French-language customer service contact details (postal addresses or web contact URLs) for product manufacturers. It is overwhelmingly empty with an 86% null rate, leaving only 7 non-null values across 6 nearly-unique strings (entropy ratio 0.976), with the top entry \u2014 a Wasa contact URL \u2014 appearing just twice. The values are unstructured free text mixing URLs, company names, and postal addresses.","role":"free_text","scope":"column","target":"customer_service_fr","treatment":"Drop or treat as sparse metadata; not usable as a categorical feature given 86% nulls and near-unique values."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.cardinality","stats.entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"This column holds French-language customer service contact details (postal addresses or web contact URLs) for product manufacturers, imported as free-form strings. It is 86% null with only 7 populated rows yielding 6 distinct values, so it functions more as sparse metadata than an analytical feature. 
Entries vary in format from full postal addresses (Nestl\u00e9, Ferrero, Cristaline) to URLs, indicating no normalization upstream.","role":"metadata","scope":"column","target":"customer_service_fr_imported","treatment":"Drop for modelling; retain only if needed as a manufacturer contact lookup."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column is flagged as kind \"unknown\" and was skipped by the profiler, so no statistics, uniqueness, or value samples are available. The only confirmed signals are 50 rows present and a 0.0 null rate. The name suggests it holds debug tags from Chinese-language ingredient text parsing, but that is inferred from the column name, not the evidence.","role":"metadata","scope":"column","target":"ingredients_text_zh_debug_tags","treatment":"Drop unless debug tags are explicitly needed; re-profile with a parser that handles this type before use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"French-language product names imported from an external source, judging by the suffix and the values like 'CRISTALINE Eau De Source 0.5L' and 'Biscuits Nutella x22 biscuits fourr\u00e9s - 304g'. Only 7 of 50 rows carry a value (null_rate 0.86), and every populated value is unique (entropy_ratio 1.0, top_rate 0.143), so this behaves as free-text rather than a category. 
The extreme nullity combined with full uniqueness makes it unusable as a grouping key.","role":"free_text","scope":"column","target":"product_name_fr_imported","treatment":"Treat as sparse free text\u2014drop for modelling or tokenize/embed if product identification is needed."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a free-text brand field listing imported product brands, with 6 distinct values across only 7 non-null rows out of 50 (null_rate 0.86). The top value 'Wasa' appears just twice (top_rate 0.286), and entropy_ratio 0.976 indicates the few present values are nearly uniformly distributed. One entry 'NESTLE DESSERT,Tablettes' looks like a comma-joined multi-value string, suggesting inconsistent encoding.","role":"feature","scope":"column","target":"brands_imported","treatment":"Split multi-value strings on comma and treat as low-coverage categorical; consider dropping given 86% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.entropy_ratio","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column holding organisation slugs (e.g. 'org-barilla-france-sa', 'org-nestle-france'), almost certainly a foreign key to an owning company. It is 88% null with only 6 non-null rows spread across 5 distinct owners, so entropy_ratio is 0.97 simply because nearly every present value is unique. 
The column is too sparse to support any aggregation or join in its current state.","role":"foreign_key","scope":"column","target":"owner_imported","treatment":"Drop or defer: 88% null leaves too few rows to join or model on."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be an internal debug-tagging field attached to Chinese product names, but saturn skipped profiling so its contents are opaque. The only confirmed facts are 50 rows with no nulls; uniqueness, value distribution, and type are all unreported. Without a profile pass it is impossible to tell whether it carries useful signal or just developer annotations.","role":"metadata","scope":"column","target":"product_name_zh_debug_tags","treatment":"Re-run profiling with this kind enabled before deciding; provisionally drop as unparsed debug metadata."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical flag indicating the source language of imported records, with values 'fr' and 'es'. The column is dominated by missingness \u2014 84% null across 50 rows \u2014 and among the 8 populated rows, 'fr' accounts for 7 (87.5%), leaving 'es' as a single observation. Cardinality is just 2, so this carries little signal in its current state.","role":"metadata","scope":"column","target":"lc_imported","treatment":"Treat nulls as a category or drop; near-constant with severe missingness limits modelling value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Chinese-language ingredients text field, likely from a localized product/food dataset. 
It is effectively empty: 98% of the 50 rows are null and the only non-null value observed is itself an empty string, giving a cardinality of 1 and entropy of 0.","role":"free_text","scope":"column","target":"ingredients_text_zh","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a free-form quantity/packaging size field mixing volume ('500 ml') and mass units ('304 g', '275 g'), stored as strings rather than parsed numerics. Coverage is extremely poor: 86% of the 50 rows are null, and among the 7 non-null values every one is unique (entropy_ratio 1.0, top_rate 0.14). With no repeated values and mixed units, it offers little categorical signal as-is.","role":"feature","scope":"column","target":"quantity_imported","treatment":"Parse into a numeric magnitude plus a unit column before use; given 86% nulls, consider dropping or imputing."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.top_value","stats.top_rate","stats.entropy","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a metadata flag indicating the basis on which nutrition values were imported, with '100g' as the sole observed value across all 8 non-null rows. The column is 84% null and has only one unique value, giving zero entropy and no discriminative power.","role":"metadata","scope":"column","target":"nutrition_data_per_imported","treatment":"Drop; constant value with 84% nulls carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy_ratio","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"French generic product names imported from an upstream source (e.g. 
Open Food Facts), holding descriptors like \"Eau De Source\" and \"Biscuit fourr\u00e9 \u00e0 la p\u00e2te \u00e0 tartiner aux noisettes et au cacao Nutella\u00ae\". The column is 86% null and every one of the 7 observed values is unique (entropy_ratio 1.0), so it behaves as free-text rather than a categorical feature. Values are in French with accented characters and brand marks, which will need normalisation if joined with other locales.","role":"free_text","scope":"column","target":"generic_name_fr_imported","treatment":"Treat as multilingual free text: normalise accents and tokenize/embed if used; otherwise drop given 86% nulls."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","n_unique","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column `owner_fields` was skipped by the profiler, so its kind is unknown and no descriptive statistics, uniqueness, or value samples are available. The only signals are a row count of 50 and a null rate of 0.0, meaning every row is populated but the contents are opaque from this evidence alone. Without a sample or type inference, nothing can be said about what the field encodes.","role":"other","scope":"column","target":"owner_fields","treatment":"Re-profile with parsing enabled (or inspect raw values) before deciding how to use this column."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Hierarchical product category paths (comma-separated taxonomy strings, mostly French with some en: prefixes) imported from an external source, likely Open Food Facts. The column is 88% null with only 6 non-null rows across 5 distinct values, so coverage is too sparse to be useful as-is. 
Entropy ratio of 0.97 confirms the few present values are nearly all distinct, and the top value appears just twice.","role":"metadata","scope":"column","target":"categories_imported","treatment":"Split on comma into hierarchical levels and use only the top level as a feature, or drop given 88% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"French-language storage instructions for products, written as free-form sentences (e.g. \"A conserver dans un endroit sec \u00e0 l'abri de la lumi\u00e8re.\"). Coverage is very thin: 86% null and only 7 distinct strings across 50 rows, each appearing exactly once, so entropy_ratio is 1.0. Despite semantic overlap (cool, dry, away from light), no two entries are phrased identically, making this unusable as a category without normalisation.","role":"free_text","scope":"column","target":"conservation_conditions_fr","treatment":"Treat as free text: normalise/cluster phrases or extract keywords (sec, frais, lumi\u00e8re) rather than one-hot encoding."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","n","top_value","top_rate","entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text French storage instructions for a product (e.g., \"A conserver \u00e0 l'abri du soleil...\"), captured as a categorical field. With 86% nulls and only 7 distinct values across 50 rows \u2014 each appearing exactly once \u2014 this behaves like sparse free text rather than a controlled vocabulary. 
Maximum entropy ratio (1.0) confirms every observed value is unique.","role":"free_text","scope":"column","target":"conservation_conditions","treatment":"Treat as free text; normalize/keyword-extract (e.g., 'sec', 'frais', 'abri') or drop given 86% nulls."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a country-of-origin tag for imported items, but with 84% nulls only 8 of 50 rows actually carry a value. Of those, 7 are 'France' and 1 is 'Espa\u00f1a', giving a top_rate of 0.875 and just 2 distinct categories. The mixed language ('Espa\u00f1a' vs the English column name) hints at inconsistent source encoding.","role":"metadata","scope":"column","target":"countries_imported","treatment":"Impute or flag missingness and normalise country names to a single language before any grouping."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language origins field listing geographic provenance and source names (towns, regions, water sources) as a comma-concatenated string. The column is almost entirely empty with a 96% null rate, leaving only 2 distinct values across 50 rows\u2014one populated entry bundling 11 locations together and one blank string. 
The packed multi-value format suggests this was flattened from a list field rather than a clean categorical.","role":"metadata","scope":"column","target":"origins_fr","treatment":"Split on commas and explode into a multi-label set before use; coverage too sparse to model directly."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Short product label field, likely a shelf-name abbreviation including brand, variant and pack size (e.g. 'CRISTALINE Eau De Source 0.5L'). It is almost entirely empty with a null_rate of 0.86, and among the 7 populated rows every value is unique (entropy_ratio 1.0, top_rate ~0.143), so it carries no repeating categories.","role":"free_text","scope":"column","target":"abbreviated_product_name","treatment":"Drop or treat as free text; too sparse and unique to use as a categorical feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","n","top_value","top_values","stats.entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text customer service contact details (postal addresses or URLs) extracted from product packaging, mostly in French. 
The column is 86% null with only 7 populated rows across 6 near-unique values, and entries are long unstructured strings mixing brands like Wasa, Cristaline, Ferrero, Kellogg's, Nestl\u00e9 and La Boulang\u00e8re.","role":"free_text","scope":"column","target":"customer_service","treatment":"Drop or parse out brand/URL/address fields separately; too sparse and unstructured to model as-is."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Concatenated provenance trail listing the producers, databases, and apps that contributed to each record (e.g., 'Database - Equadis, Database - GDSN, Databases, Producers, Producer - nestle-france'). 84% of rows are null and the 8 non-null values are all unique, giving entropy_ratio 1.0 \u2014 every observed string is a bespoke composite rather than a clean category. Repeated tokens within a single value (e.g., 'Producers' appearing twice) suggest the field was assembled by concatenation without deduplication.","role":"metadata","scope":"column","target":"data_sources_imported","treatment":"Split on commas and one-hot or multi-hot encode the underlying source tokens rather than using the raw string."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_value","stats.top_rate","stats.entropy","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an error/diagnostic flag explaining why a NOVA food classification group could not be assigned. It is null in 96% of 50 rows, and the only observed value across the 2 non-null cases is \"too_many_unknown_ingredients\" (top_rate 1.0, cardinality 1, entropy 0). 
With a single category present, the column carries no discriminative signal in this sample.","role":"metadata","scope":"column","target":"nova_group_error","treatment":"Drop or retain only as a boolean error-present flag; near-constant and overwhelmingly null."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR result of a German ingredients list (ingredients_text_de_ocr) tied to a specific timestamped run. Of 50 rows, 98% are null and only a single non-null value exists \u2014 a detailed Nuss-Nougat-Creme ingredient declaration \u2014 giving cardinality 1 and entropy 0.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1648897071_result","treatment":"Drop; 98% null with a single observed value provides no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Romanian-language packaging text field that is essentially empty: 96% of the 50 rows are null and the remaining 2 non-null values are both blank strings, yielding a single observed category and zero entropy.","role":"free_text","scope":"column","target":"packaging_text_ro","treatment":"Drop; no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A Romanian-language product name field that is effectively empty: 96% of the 50 rows are null, leaving only 2 non-null values, one of which is an empty string and the other an English phrase ('Sour Cream & Onion'). 
With cardinality of 2 and no actual Romanian content observed, this column carries no usable signal in the sample.","role":"metadata","scope":"column","target":"product_name_ro","treatment":"Drop; null_rate 0.96 and no Romanian values present."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.cardinality","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Identifier-style categorical capturing a producer/version reference, but 92% of the 50 rows are null, leaving only 4 populated values. The non-null entries are inconsistent in shape \u2014 a small integer ('1'), an ISO timestamp, and an 8-digit number \u2014 suggesting the field is overloaded or improperly typed. With cardinality 3 and top_rate 0.5 over a tiny populated subset, no reliable signal can be drawn.","role":"metadata","scope":"column","target":"producer_version_id","treatment":"Drop or quarantine until the upstream schema is clarified; not usable as a feature at 92% null with mixed value types."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.entropy_ratio","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Free-text serving size descriptors imported from an upstream source, mixing grams with French unit hints like 'tranche' and 'carr\u00e9s'. 88% of the 50 rows are null and the 6 non-null values are all unique, so entropy_ratio is 1.0 and there is no modal serving. Format is inconsistent (e.g. 
'30 g' vs '25.6 g (5 carr\u00e9s (25,6 g))'), making direct aggregation unsafe.","role":"free_text","scope":"column","target":"serving_size_imported","treatment":"Parse the leading numeric grams into a numeric column and discard the free-text remainder."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.top_rate","stats.top_value","stats.entropy","top_values","n"],"model":"anthropic:claude-opus-4-7","narrative":"A boolean-style flag indicating whether nutrition data was skipped during import. With a 0.92 null rate and only 4 non-null rows all reading \"false\" (top_rate 1.0, cardinality 1, entropy 0.0), the column carries no information in this sample.","role":"metadata","scope":"column","target":"no_nutrition_data_imported","treatment":"Drop; constant value with overwhelming nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_rate","top_values","cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column capturing imported packaging type, almost certainly free-form labels like 'Enveloppe' or 'Bo\u00eete, Barquette'. It's effectively unusable as-is: 92% of the 50 rows are null, leaving only 4 observed values across 2 distinct categories, with 'Enveloppe' covering 3 of them.","role":"metadata","scope":"column","target":"packaging_imported","treatment":"Drop or set aside until more coverage is available; 92% nulls leave nothing to model."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Romanian-language ingredients text, almost entirely absent in this sample. 96% of the 50 rows are null, and the only 2 non-null values are empty strings, giving cardinality 1 and entropy 0. 
There is no usable signal here.","role":"free_text","scope":"column","target":"ingredients_text_ro","treatment":"Drop; effectively empty for this sample."},{"confidence":"low","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.top_rate","stats.entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a sparsely populated categorical field tracking some imported producer version identifier, with 92% null_rate leaving only 4 non-null values across 50 rows. The 3 distinct values are wildly inconsistent in format \u2014 '1', a timestamp '2021-01-25T13:53:49+01:00', and a numeric '44217063' \u2014 suggesting the column conflates multiple semantics or has been mis-mapped during import. With only 4 observations, top_rate of 0.5 and entropy_ratio of 0.95 are not meaningful signals.","role":"metadata","scope":"column","target":"producer_version_id_imported","treatment":"Drop unless the import pipeline can be fixed to emit a single consistent value type."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Imported product labels (likely certifications or dietary tags) carried over from an external source, with values like 'V\u00e9g\u00e9tarien' and comma-separated certification strings ('Point Vert, Rainforest Alliance, Triman'). The column is 90% null, leaving only 5 populated rows across 3 distinct values, and the top value covers 60% of those. 
With such sparse coverage and multi-label strings packed into single cells, this field is barely usable as-is.","role":"metadata","scope":"column","target":"labels_imported","treatment":"Split comma-separated tags and one-hot encode, but expect to drop given 90% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR-extracted German ingredients text from a timestamped scan (1648990410), capturing raw product label text. It is effectively empty: 98% null with only 1 non-null value out of 50 rows, a single German ingredients string for a hazelnut-nougat cookie product. With cardinality 1 and entropy 0, it carries no discriminative signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1648990410_result","treatment":"Drop; 98% null and only one observed value provides no usable signal."},{"confidence":"medium","critiques":[],"evidence_keys":["null_rate","n_unique","top_value","top_rate","top_values","entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"Categorical column listing imported allergen declarations, with 90% nulls leaving only 5 populated rows across 4 distinct values. Entries are comma-separated multi-allergen strings in French (e.g., 'Gluten, Graines de s\u00e9same', '\u0152ufs, Gluten'), and one value embeds what looks like a GS1 code ('Gs1:T4078:ML'), suggesting inconsistent encoding. 
'Gluten' is the only repeated value (2 of 5), and entropy_ratio of 0.96 reflects the near-uniform spread across the tiny populated subset.","role":"feature","scope":"column","target":"allergens_imported","treatment":"Split on commas into a multi-label allergen set and impute or flag the 90% missing before use."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an OCR-extracted German ingredients text field (timestamped 1648990410), likely from a food product database such as Open Food Facts. Out of 50 rows, 98% are null and only a single non-null value exists \u2014 a long ingredient string for a hazelnut-nougat cookie product. With cardinality 1 and entropy 0, the column carries no discriminative signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1648990410","treatment":"Drop; 98% null and only one unique OCR value provides no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a German-language OCR extraction of an ingredients list (timestamped 1648897071), likely from Open Food Facts product packaging. The column is essentially empty: 98% null across 50 rows, with only 1 non-null value present, so cardinality is 1 and entropy is 0. 
The single observed entry is a long free-text ingredients string for a hazelnut-nougat-cream product, with allergens marked by underscores.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1648897071","treatment":"Drop; the column is 98% null with only one unique value and carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Romanian-language generic product name field, but it is effectively empty: 96% of the 50 rows are null, and the only 2 non-null entries are blank strings, giving a cardinality of 1 and entropy of 0. There is no usable signal here.","role":"metadata","scope":"column","target":"generic_name_ro","treatment":"Drop; the column carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'origin_ro' is effectively empty: 96% of the 50 rows are null, and the only 2 non-null values are blank strings, giving a single observed category with zero entropy. There is no usable signal here.","role":"other","scope":"column","target":"origin_ro","treatment":"Drop; column carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy_ratio","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a shortened/imported product name field, but it's almost entirely empty: 94% null across 50 rows, leaving only 3 non-null values, each unique (e.g., 'Authentique 275g, fr', 'Fibres 230g, fr', 'DESSERT Noir 205g'). With cardinality equal to the populated count and maximal entropy_ratio of 1.0, there is no repetition to learn from. 
The mixed formatting and language hints (French abbreviations, weight suffixes) further suggest inconsistent upstream import.","role":"metadata","scope":"column","target":"abbreviated_product_name_imported","treatment":"Drop or defer \u2014 too sparse and near-unique to be useful as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","cardinality","top_value","top_values","entropy_ratio"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to record allergen trace declarations (in French) on food products, listing items like Lupin, Lait, Moutarde, Soja as comma-separated lists. It is almost entirely empty with a 92% null rate, leaving only 4 non-null values across 50 rows, each unique. With cardinality equal to the populated count, every observed value is its own category, making aggregation unreliable.","role":"free_text","scope":"column","target":"traces_imported","treatment":"Split on commas into a multi-label allergen indicator set, but expect sparse signal given the 92% null rate."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'specific_ingredients' was skipped by the profiler, so no type, uniqueness, or distribution stats are available beyond a row count of 50 and a null rate of 0.0. The name suggests it holds ingredient lists, likely free text or arrays, which is consistent with the profiler declining to summarise it. 
Without sample values or cardinality we cannot confirm structure or detect duplicates, language mix, or skew.","role":"free_text","scope":"column","target":"specific_ingredients","treatment":"Inspect raw values and parse or tokenize before any modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Russian-language product name field, almost entirely absent: 94% of the 50 rows are null and only 2 distinct non-null values appear, one of which is an empty string. The single real value observed is '\u042d\u043a\u0441e\u043b\u0435\u043d\u0441 99% \u043a\u0430\u043a\u0430\u043e', suggesting this column is a sparsely populated localization of a product name.","role":"metadata","scope":"column","target":"product_name_ru","treatment":"Drop or defer; too sparse (94% null) to use as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical column flagged as Russian-origin metadata, but it is effectively empty: 94% of the 50 rows are null and the only non-null value observed is the empty string, repeated 3 times. Cardinality is 1 and entropy is 0, so this column carries no information as-is.","role":"metadata","scope":"column","target":"origin_ru","treatment":"Drop; the column has a single empty value and 94% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Russian-language ingredient text with allergen markup, almost entirely absent from this sample. 
94% of rows are null and the remaining 6% are all empty strings, leaving a single unique value and zero entropy.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_ru","treatment":"Drop; no usable signal in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Russian-language packaging text field that is effectively empty: 94% of 50 rows are null and the remaining 3 non-null entries are all the empty string, giving a single observed value and zero entropy. There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_ru","treatment":"Drop; column is 94% null with the only non-null value being an empty string."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Russian-language generic product name field, populated for only 3 of 50 rows (null_rate 0.94). Among the 3 non-null entries, 2 are empty strings and 1 is '\u041f\u043b\u0438\u0442\u043a\u0430 \u0433\u043e\u0440\u044c\u043a\u043e\u0433\u043e \u0448\u043e\u043a\u043e\u043b\u0430\u0434\u0430 (99% \u043a\u0430\u043a\u0430\u043e)', so effectively only one real value is present. The column is unusable as a feature at this sample size.","role":"metadata","scope":"column","target":"generic_name_ru","treatment":"Drop or hold aside until coverage improves; do not use for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Russian-language ingredient text from what appears to be a multilingual product catalog. 
The column is effectively empty: 94% null and the only 3 non-null entries are blank strings, giving cardinality 1 and zero entropy.","role":"free_text","scope":"column","target":"ingredients_text_ru","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Danish-language ingredients text for food products, evidently sourced from Open Food Facts-style multilingual labeling. The column is almost entirely empty (null_rate 0.96), with only 2 non-null values out of 50, one of which is a blank string. The single substantive entry is actually a mixed Swedish/Danish/Norwegian ingredient list with allergen tokens marked by underscores, suggesting the locale tagging is unreliable.","role":"free_text","scope":"column","target":"ingredients_text_da","treatment":"Drop unless modelling Danish text specifically; coverage is too sparse to be useful."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","n","top_value","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"Danish-language ingredients text with HTML-tagged allergen spans, evidently sourced from a multilingual food product database. The column is 96% null with only 2 non-null values out of 50, one of which is an empty string, leaving effectively a single real entry that mixes Swedish and Danish/Norwegian terms.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_da","treatment":"Drop unless Danish-specific allergen extraction is required; coverage is too sparse to model."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","top_values","stats.top_rate","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"Danish product name field with only 2 non-null values out of 50 rows (null_rate 0.96), each appearing once. 
The two observed labels (\"Original\", \"Alpine Milk\") look like product variant descriptors rather than full product names. With 96% missingness the column carries almost no signal as-is.","role":"metadata","scope":"column","target":"product_name_da","treatment":"Drop or defer until backfilled; 96% nulls make it unusable for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Danish-language packaging text field that is effectively empty: 96% of the 50 rows are null, and the only 2 non-null values are empty strings, giving cardinality 1 and zero entropy. There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_da","treatment":"Drop; column is empty in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Danish-language generic product name field, almost entirely empty: 96% null across 50 rows, leaving only 2 non-null observations. The two surviving values are 'Kiks' and an empty string, so there is essentially no usable signal here.","role":"metadata","scope":"column","target":"generic_name_da","treatment":"Drop; null rate too high to be useful."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'forest_footprint_data' was skipped by the profiler, so its kind is unknown and no descriptive statistics are available. 
The only confirmed signals are 50 rows with a 0.0 null rate; uniqueness, type, and value distribution are all missing.","role":"other","scope":"column","target":"forest_footprint_data","treatment":"Re-profile or manually inspect this column before any downstream use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column appears to be the Danish-localized product origin field ('origin_da') but is effectively empty: 96% of the 50 rows are null and the only observed value is the empty string, which accounts for the remaining 2 entries. With cardinality of 1 and entropy of 0, it carries no information.","role":"metadata","scope":"column","target":"origin_da","treatment":"Drop; the column has no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the Serbian-localized product origin field, but it is effectively empty: 96% of the 50 rows are null and the only 2 non-null values are blank strings, giving a single observed category with entropy 0. There is no usable signal here.","role":"metadata","scope":"column","target":"origin_sr","treatment":"Drop; column is 96% null with only blank values."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold OCR-extracted Dutch ingredient text from product packaging, likely a per-image result field. It is 98% null with only one non-null value present ('Cacaomassa, suiker, cacaoboter, natuurlijk Bourbon vanille - stokje.'), giving cardinality 1 and zero entropy. 
With effectively no variance or coverage, it carries no analytical signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_nl_ocr_1675675383_result","treatment":"Drop; near-empty with a single observed value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.top_value","stats.top_rate","n"],"model":"anthropic:claude-opus-4-7","narrative":"Czech-language ingredients text, almost entirely absent: 94% of the 50 rows are null and only 2 distinct non-null values exist, one of which is an empty string appearing twice. The single substantive entry is a Czech ingredients list (\"Kakaov\u00e1 hmota, cukr, kakaov\u00e9 m\u00e1slo, vanilka.\"), confirming this is a localized free-text field rather than a categorical feature.","role":"free_text","scope":"column","target":"ingredients_text_cs","treatment":"Drop for modelling; retain only if Czech-localized text is specifically needed."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Czech-localised product name field (`product_name_cs`) that is almost entirely unpopulated: 94% of the 50 rows are null and only 2 distinct values appear, one of which is an empty string. 
The single real label observed is an English-language entry (\"Excellence 70% Cocoa Intense Dark\"), suggesting the Czech translation pipeline has not been applied.","role":"metadata","scope":"column","target":"product_name_cs","treatment":"Drop unless Czech localisation is required; the column is 94% null and effectively empty."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical field 'origin_hu' that is 92% null and, among the 4 non-null rows, contains only the empty string. Effective cardinality is 1 with zero entropy, so the column carries no information in this sample.","role":"metadata","scope":"column","target":"origin_hu","treatment":"Drop; the column is constant and almost entirely null."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n"],"model":"anthropic:claude-opus-4-7","narrative":"Hungarian packaging text field that is effectively empty: 92% null and the only non-null value across 50 rows is the empty string, occurring 4 times. Cardinality is 1 with entropy 0, so the column carries no information.","role":"metadata","scope":"column","target":"packaging_text_hu","treatment":"Drop; no signal (single empty value, 92% null)."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the Czech-localized product origin field, but it is effectively empty: 96% of the 50 rows are null and the only non-null entries are blank strings. 
With cardinality of 1 and entropy of 0, the column carries no information.","role":"metadata","scope":"column","target":"origin_cs","treatment":"Drop; the column is 96% null with a single blank value otherwise."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","cardinality","top_values","top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Hungarian-language ingredient lists with inline HTML <span class=\"allergen\"> markup highlighting allergens, drawn from what looks like a food-product catalogue (Open Food Facts style). The column is almost entirely empty (null_rate 0.94) \u2014 only 3 of 50 rows are populated, and each of those values is unique. Notable surprise: at least one entry is multilingual, bundling Hungarian, Romanian and Bulgarian label text into a single cell.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_hu","treatment":"Strip HTML tags and treat as optional free text; too sparse (94% null) to use as a feature without heavy imputation."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Czech-localized generic product name field, but it carries virtually no information in this sample. 94% of rows are null, and the only distinct non-null value is itself an empty string (3 occurrences), giving entropy of 0.0 and a top_rate of 1.0.","role":"metadata","scope":"column","target":"generic_name_cs","treatment":"Drop; column is effectively empty (94% null and only blank values otherwise)."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_rate","top_value","top_values","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Hungarian-language ingredient declarations for food products, mirroring Open Food Facts' per-language ingredients_text fields. 
The column is 92% null with only 4 distinct values across 50 rows, and one of those is an empty string while another is a multi-language label dump (HU/RO/BG) rather than pure Hungarian. Top value frequency is just 0.25, so there is no real mode to lean on.","role":"free_text","scope":"column","target":"ingredients_text_hu","treatment":"Treat as sparse free text; drop or language-filter before any NLP, and don't use as a feature without imputing the 92% missing."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"Serbian-language ingredient list field (likely a localized variant of an ingredients_text column). Out of 50 rows, only 2 are populated (null_rate 0.96), and one of those is an empty string, leaving exactly one substantive value. There is essentially no signal here at this sample size.","role":"free_text","scope":"column","target":"ingredients_text_sr","treatment":"Drop unless analysis is restricted to Serbian-localized rows; otherwise too sparse to use."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Serbian-language packaging text field, but it is effectively empty in the sample: 96% of 50 rows are null and the only non-null entries are blank strings, giving cardinality of 1 and entropy of 0. 
There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_sr","treatment":"Drop the column; it carries no information in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be Dutch-language OCR-extracted ingredient text from product packaging, likely a sparsely populated language variant of an ingredients field. Out of 50 rows, 98% are null and the single non-null value is a chocolate ingredients list ('Cacaomassa, suiker, cacaoboter, natuurlijk Bourbon vanille- stokje.'). With cardinality of 1 and entropy of 0, this column carries effectively no signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_nl_ocr_1675675383","treatment":"Drop; 98% null with a single observed value provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Czech-language ingredient list with allergen annotations for food products. With a 98% null rate and only 1 non-null value across 50 rows ('Kakaov\u00e1 hmota, cukr, kakaov\u00e9 m\u00e1slo, vanilka.'), the column carries virtually no information in this sample. 
Entropy is 0.0 and cardinality is 1, so it cannot discriminate between records as-is.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_cs","treatment":"Drop for modelling; revisit only if a larger sample provides meaningful coverage."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value","stats.cardinality","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Serbian-language generic product name field (generic_name_sr), likely a localized label in a multilingual product catalog. It is almost entirely empty: 96% null across 50 rows, with only 2 distinct values observed, one of which is itself a blank string. The single non-empty entry is 'Tamna \u010dokolada sa 70% kakaa', so this column carries virtually no usable signal in this sample.","role":"metadata","scope":"column","target":"generic_name_sr","treatment":"Drop or ignore for modelling; retain only if a Serbian-locale view is required."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n"],"model":"anthropic:claude-opus-4-7","narrative":"Czech-language packaging text field that is effectively empty: 94% null and the only non-null value observed (3 rows) is itself an empty string, giving cardinality 1 and entropy 0. 
There is no usable signal here in this sample.","role":"free_text","scope":"column","target":"packaging_text_cs","treatment":"Drop; column is constant-empty with 94% nulls."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This looks like a Serbian-localized product name field, but it is effectively empty: 96% of the 50 rows are null and only 2 distinct non-null values appear, one in English ('Excellence 70% Cocoa Intense Dark') and one in Cyrillic ('\u0422\u0435\u0447\u0435\u043d \u0428\u043e\u043a\u043e\u043b\u0430\u0434 \u041d\u0443\u0442\u0435\u043b\u0430'). The language mix between Latin English and Cyrillic Serbian is notable for a column nominally tagged 'sr'.","role":"metadata","scope":"column","target":"product_name_sr","treatment":"Drop or defer until coverage improves; with 96% nulls and 2 unique values it carries no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR-extracted Hungarian ingredients text for a single product (likely chocolate: cocoa mass, sugar, cocoa butter, vanilla), captured from one timestamped scan. With null_rate 0.98 and only 1 unique non-null value across n=50, this column is effectively empty and carries no comparative signal. 
The single populated row repeats verbatim, so cardinality and entropy are both at floor.","role":"free_text","scope":"column","target":"ingredients_text_hu_ocr_1571428260_result","treatment":"Drop; 98% null with a single OCR string offers no modelling value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Hungarian-language OCR extraction of an ingredients list (likely from a chocolate product, mentioning cocoa mass, sugar, cocoa butter, and bourbon vanilla). Of 50 rows, 98% are null and only 1 non-null value exists, so the column is effectively empty. The single populated entry is free-text in Hungarian, not a category, despite being typed as categorical.","role":"free_text","scope":"column","target":"ingredients_text_hu_ocr_1571428260","treatment":"Drop; 98% null with a single Hungarian free-text value carries no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Hungarian generic-name field that is almost entirely missing: 92% of the 50 rows are null, and of the 4 non-null entries, 3 are empty strings and only 1 carries a value (\"Finom\"). 
With cardinality of 2 and a top_rate of 0.75 on the empty string, this column carries virtually no usable signal in the sample.","role":"metadata","scope":"column","target":"generic_name_hu","treatment":"Drop unless a fuller source can be joined in; current null rate makes it unusable."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Hungarian-language product name field that is effectively empty: 92% of the 50 rows are null, and the only 4 non-null entries collapse to 3 distinct strings (one of which is the empty string, appearing twice). The two actual values present (\"Excellence 70% Cocoa Intense Dark\", \"Dark Chocolate 70% Cacao\") are in English, not Hungarian, suggesting the localisation pipeline never populated this column.","role":"metadata","scope":"column","target":"product_name_hu","treatment":"Drop; null_rate 0.92 and no genuine Hungarian content make it unusable."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Serbian-language ingredients list with allergen annotations, populated for only 2 of 50 rows (null_rate 0.96). Of the two non-null entries, one is an empty string and the other is a chocolate ingredient list, leaving effectively a single usable value. Coverage is too sparse to support any aggregate analysis.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_sr","treatment":"Drop or defer; coverage is 4% and insufficient for modelling."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the result of an OCR pass extracting Spanish ingredient text, with the timestamped name suggesting it's one run among many. 
Of 50 rows, 98% are null and the single non-null value is a Spanish chocolate ingredients list (cocoa paste, sugar, cocoa butter, sunflower lecithin E-322, vanilla extract, 70% cocoa minimum). With cardinality of 1 and entropy 0, this column carries essentially no information across the dataset.","role":"free_text","scope":"column","target":"ingredients_text_es_ocr_1548767061_result","treatment":"drop; 98% null with only one distinct OCR result provides no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical field, likely a localized product name (suffix _xx suggests a translation/locale variant). It is effectively empty: 96% null and the only 2 non-null rows contain the empty string, giving cardinality 1 and zero entropy.","role":"metadata","scope":"column","target":"product_name_xx","treatment":"Drop; the column carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a localized generic name field (suffix _xx suggests a translation/locale variant), but it is effectively empty: 96% of the 50 rows are null, and the only 2 non-null values are blank strings. 
Cardinality is 1 with zero entropy, so the column carries no information.","role":"metadata","scope":"column","target":"generic_name_xx","treatment":"Drop; null_rate 0.96 and single empty value provide no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Spanish-language OCR capture of an ingredients list (likely from a chocolate product label, given 'Pasta de cacao' and '70% m\u00ednimo'). It is effectively empty: 98% null across 50 rows, with the single non-null value being one verbatim ingredients string. There is no analytical signal here \u2014 entropy is 0 and cardinality is 1.","role":"free_text","scope":"column","target":"ingredients_text_es_ocr_1548767061","treatment":"Drop; 98% null with only one observed value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a localized ingredients text field (suffix _xx suggests a placeholder or unknown locale variant). It is effectively empty: 96% of the 50 rows are null, and the only 2 non-null entries are both empty strings, giving cardinality 1 and entropy 0.","role":"free_text","scope":"column","target":"ingredients_text_xx","treatment":"Drop; the column carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'origin_xx' is effectively empty: 98% of its 50 rows are null, and the single non-null value is itself an empty string, giving a cardinality of 1 and entropy of 0. 
There is no usable signal here.","role":"other","scope":"column","target":"origin_xx","treatment":"Drop the column; it carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a localized packaging text field (xx language suffix) that is essentially empty in this sample. 98% of rows are null and the single non-null value is itself an empty string, leaving zero effective cardinality and zero entropy.","role":"metadata","scope":"column","target":"packaging_text_xx","treatment":"Drop; the column carries no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Likely an Urdu-language ingredient text field (ingredients_text_ur), almost entirely absent from this sample. 98% of rows are null, and the single non-null value is an empty string, leaving zero usable content. Cardinality is 1 with entropy 0.0, so the column carries no information here.","role":"free_text","scope":"column","target":"ingredients_text_ur","treatment":"Drop from modelling; retain only if a fuller multilingual extract becomes available."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an Urdu-language product name field that is essentially empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string. 
Cardinality collapses to 1 and entropy is 0, so the column carries no information as captured.","role":"metadata","scope":"column","target":"product_name_ur","treatment":"Drop; column is effectively empty with zero entropy."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'origin_he' is effectively empty: 98% of the 50 rows are null and the only observed value is the empty string, giving a cardinality of 1 and entropy of 0. There is no usable signal here.","role":"metadata","scope":"column","target":"origin_he","treatment":"Drop; column carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","top_values","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Hebrew product name field that is almost entirely empty \u2014 96% null across 50 rows, leaving only 2 non-null values, both unique (\u05e0\u05d5\u05d8\u05dc\u05d4 and \u05ea\u05e4\u05d5\u05e6\u05d9\u05e4\u05e1 \u05e9\u05de\u05e0\u05ea \u05d1\u05e6\u05dc). With just two observations the entropy ratio of 1.0 is meaningless, and the column cannot support any analysis in its current state.","role":"metadata","scope":"column","target":"product_name_he","treatment":"Drop or defer until backfilled; 96% null makes it unusable downstream."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'origin_ur' appears to be the Urdu-language ('_ur') variant of the product origin field, and it is near-empty: 98% nulls across 50 rows and only 1 non-null value, which is itself an empty string. Cardinality is 1 and entropy is 0, so the column carries no information as captured. 
The '_ur' suffix matches the other localized columns in this dataset (e.g. 'product_name_ur', 'origin_he', 'origin_el'), so the name is most likely not a truncated 'origin_url'; the total absence of real values suggests an unused field.","role":"metadata","scope":"column","target":"origin_ur","treatment":"Drop; column has 98% nulls and a single empty-string value, providing no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an Urdu-language generic name field, likely a localized translation of a food product's generic name. It is effectively empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string, giving cardinality 1 and entropy 0. There is no usable signal here.","role":"metadata","scope":"column","target":"generic_name_ur","treatment":"Drop the column; it is 98% null with the only present value being blank."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Hebrew packaging text field that is essentially empty: 98% of the 50 rows are null and the single non-null observation is itself an empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here for any downstream task.","role":"free_text","scope":"column","target":"packaging_text_he","treatment":"Drop the column; it carries no information."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Hebrew-language ingredient text field, almost entirely absent from this sample. 
98% of the 50 rows are null, and the single non-null value is an empty string, leaving cardinality at 1 and entropy at 0.","role":"free_text","scope":"column","target":"ingredients_text_he","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Likely an Urdu-language packaging text field, but it carries essentially no information here: 98% of rows are null and the only non-null value observed is an empty string. Cardinality is 1 with entropy 0.0, so the column is constant across the populated rows.","role":"free_text","scope":"column","target":"packaging_text_ur","treatment":"Drop; effectively empty with 98% nulls and a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"Hebrew generic product name field, but it is effectively empty: 98% null across 50 rows, leaving a single non-null value (a Hebrew product description) that occupies 100% of the observed entries. Cardinality is 1 and entropy is 0, so the column carries no discriminating signal in this sample.","role":"metadata","scope":"column","target":"generic_name_he","treatment":"Drop from modelling; revisit only if a fuller extract populates the field."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"Hebrew-localized ingredients-with-allergens text, almost entirely absent: 98% null across 50 rows and the single non-null value is an empty string. 
Cardinality is 1 with zero entropy, so this column carries no information in this sample.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_he","treatment":"Drop; no usable signal in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","top_values","stats.entropy","stats.top_value","n"],"model":"anthropic:claude-opus-4-7","narrative":"Producer-supplied Nutri-Score letter grade (a\u2013e scale), captured here as three distinct values: 'c', 'e', and 'b', each appearing once. The column is essentially empty, with a 94% null rate leaving only 3 of 50 rows populated, so the apparent uniform entropy (1.58) is an artefact of tiny sample size. No 'a' or 'd' grades observed in the evidence.","role":"feature","scope":"column","target":"nutriscore_grade_producer","treatment":"Drop or defer; too sparse (94% null) to use until producer coverage improves."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","top_values","stats.cardinality"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Nutri-Score grade (a-e scale) imported from producer data, stored as a categorical letter grade. The column is almost entirely empty with a 94% null rate, leaving only 3 non-null values across 3 distinct grades (c, e, b) \u2014 too sparse to draw any distributional conclusions.","role":"feature","scope":"column","target":"nutriscore_grade_producer_imported","treatment":"Drop or treat as missing-indicator only; too sparse (94% null) to use as a feature."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be Greek-language packaging text, but it's effectively empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string. 
Cardinality is 1 with zero entropy, meaning there is no usable signal here whatsoever.","role":"free_text","scope":"column","target":"packaging_text_el","treatment":"Drop the column; it has no observed content."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n"],"model":"anthropic:claude-opus-4-7","narrative":"Greek-language ingredients-with-allergens text field that is effectively empty in this sample: 98% null and the only non-null value observed is itself an empty string. With cardinality of 1 and entropy 0, this column carries no signal here.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_el","treatment":"Drop; no usable content in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This is the Greek-language ingredients text field, presumably from a multilingual food product dataset. It is effectively empty: 98% null across 50 rows, and the single non-null value is itself an empty string, leaving cardinality at 1 and entropy at 0.","role":"free_text","scope":"column","target":"ingredients_text_el","treatment":"Drop; no usable signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Greek-language generic name field that is effectively empty: 98% nulls and the only observed non-null value is itself an empty string, giving a single unique entry across 50 rows. 
Entropy is 0.0 and top_rate is 1.0, so the column carries no information in this sample.","role":"metadata","scope":"column","target":"generic_name_el","treatment":"Drop; the column has no usable signal here."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'origin_el' is nearly entirely empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string, leaving cardinality at 1 and entropy at 0. There is no usable signal here whatsoever.","role":"other","scope":"column","target":"origin_el","treatment":"Drop the column; it is effectively all null with no variance."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Greek-language product name field that is effectively empty in this sample. 98% of rows are null and the single non-null value is itself an empty string, giving cardinality 1 and zero entropy. 
There is no usable signal here at n=50.","role":"metadata","scope":"column","target":"product_name_el","treatment":"Drop from modelling; revisit only if a larger sample shows actual Greek text."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Thai-language generic product name field that is effectively empty in this sample: 98% of 50 rows are null and the only non-null value observed is the empty string, giving a single distinct value and zero entropy.","role":"metadata","scope":"column","target":"generic_name_th","treatment":"Drop from modelling; the column carries no information in this slice."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold the OCR result of a German ingredients text extraction (likely from a product label image), with a timestamp embedded in the column name. Of 50 rows, 98% are null and only one non-null value exists \u2014 a single German cocoa-product ingredient list mentioning possible traces of nuts, milk, and soy. 
With cardinality 1 and entropy 0, the column carries effectively no signal at this sample size.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1559410715_result","treatment":"Drop; 98% null and only one distinct OCR string provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy_ratio","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Thai-localized ingredients-with-allergens text field, but it is effectively empty: 98% of 50 rows are null and the single populated row contains an English-language ingredients string for a 99% cocoa product. The column carries zero entropy (entropy_ratio 0.0) and only one distinct value, so it provides no analytical signal. The language mismatch (English content in a _th column) is also notable.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_th","treatment":"Drop; 98% null and a single non-Thai value make it unusable."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Thai-language packaging text field, but it is effectively empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string. Cardinality is 1 with zero entropy, so the column carries no information.","role":"free_text","scope":"column","target":"packaging_text_th","treatment":"Drop; no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Thai-language product name field, almost entirely empty: 98% null across 50 rows with only a single non-null value (one Lindt dark chocolate entry). 
Cardinality is 1 and entropy is 0, so this column carries no discriminating signal in this sample.","role":"metadata","scope":"column","target":"product_name_th","treatment":"Drop from modelling; revisit only if a fuller Thai-localised dump becomes available."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold the OCR result of a German ingredients label (one specific dark chocolate product) tied to a timestamped run (1548767354). Of 50 rows, 98% are null and the single non-null value occupies the entire observed cardinality of 1, giving zero entropy. There is effectively no variation to learn from here.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1548767354_result","treatment":"Drop; 98% null and only one distinct OCR string."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","cardinality","entropy","top_value","top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This is a Thai-language ingredients text field (ingredients_text_th), but 98% of the 50 rows are null and the single non-null entry is actually English text describing cocoa-based product ingredients. With cardinality of 1 and entropy of 0, the column carries no usable signal and the one populated value appears to be in the wrong language for the field.","role":"free_text","scope":"column","target":"ingredients_text_th","treatment":"Drop; 98% null and the lone value is mislocalized."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Column 'origin_th' is effectively empty: 98% of the 50 rows are null and the only observed non-null value is itself an empty string, giving a cardinality of 1 and entropy of 0. 
There is no signal here to model or join on.","role":"other","scope":"column","target":"origin_th","treatment":"Drop; the column is 98% null with a single empty-string value otherwise."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","cardinality","entropy","top_value","top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be German-language OCR text of product ingredient lists, likely from a food database (the sole observed value describes dark chocolate ingredients). The column is almost entirely empty with a 0.98 null rate, and only one non-null record exists across 50 rows, yielding cardinality 1 and entropy 0. With a single observation there is no usable variation for analysis.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1548767354","treatment":"Drop; 98% null with only one observed value provides no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a German-language OCR extraction of an ingredients list (likely from a chocolate product packaging), captured as free text. It is almost entirely empty with a 0.98 null rate, and the single non-null row contains one verbose ingredient declaration, giving cardinality 1 and entropy 0.0. 
With only one observed value out of 50 rows, this column carries no usable signal as-is.","role":"free_text","scope":"column","target":"ingredients_text_de_ocr_1559410715","treatment":"Drop; effectively empty (98% null, single distinct OCR string)."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an Italian-language OCR extraction of an ingredients list, likely from a food product label (the lone value describes 99% dark chocolate). The column is effectively empty: 98% null across 50 rows, with only a single non-null value, giving cardinality 1 and entropy 0. There is no variation to learn from here.","role":"free_text","scope":"column","target":"ingredients_text_it_ocr_1559410715","treatment":"Drop; 98% null with a single observed value carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold OCR-extracted Italian ingredient text (timestamp-suffixed name suggests a single OCR pass result). It is effectively empty: 98% null across n=50, with only one non-null value \u2014 a chocolate ingredient list \u2014 giving cardinality 1 and zero entropy.","role":"free_text","scope":"column","target":"ingredients_text_it_ocr_1559410715_result","treatment":"Drop; a single non-null OCR string carries no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","cardinality","top_value","top_rate","n"],"model":"anthropic:claude-opus-4-7","narrative":"Likely a French-language packaging description imported from an external source (e.g., Open Food Facts), describing recycling instructions for components. 
The column is 98% null and only a single non-null value appears across 50 rows, so it carries no analytical signal in this sample.","role":"free_text","scope":"column","target":"packaging_text_fr_imported","treatment":"Drop; near-entirely null with no variance."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language preparation/readiness label imported from an external source, indicating how a product is prepared. It is effectively unusable here: 98% of the 50 rows are null, and the single non-null value is \"Produit pr\u00eat \u00e0 consommer\", giving cardinality 1 and entropy 0.","role":"metadata","scope":"column","target":"preparation_fr_imported","treatment":"Drop; near-entirely null with a single constant value carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A categorical preparation field, likely indicating how a food product should be prepared before consumption. It is effectively empty: 98% of the 50 rows are null, leaving only a single observed value (\"Produit pr\u00eat \u00e0 consommer\") with cardinality 1 and zero entropy. With no variation among the populated rows, the column carries no discriminative signal.","role":"metadata","scope":"column","target":"preparation","treatment":"Drop; 98% null and only one observed value."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language preparation instruction field, likely metadata describing how a product is consumed. 
It is essentially empty: 98% of the 50 rows are null, and the single non-null value is \"Produit pr\u00eat \u00e0 consommer\", giving cardinality 1 and entropy 0. There is no variation to learn from in this sample.","role":"metadata","scope":"column","target":"preparation_fr","treatment":"Drop; 98% null with only one observed value provides no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a lowercased ingredients text field, likely derived from a product or recipe source. It is effectively empty: 98% of the 50 rows are null, and the single non-null value is itself an empty string, giving cardinality 1 and entropy 0. There is no usable signal here.","role":"free_text","scope":"column","target":"ingredients_text_lc","treatment":"Drop; the column is 98% null and the only observed value is empty."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"A lowercased product name field that is effectively empty: 98% of the 50 rows are null and the single non-null value is also an empty string, giving a cardinality of 1 and entropy of 0. There is no usable signal here.","role":"feature","scope":"column","target":"product_name_lc","treatment":"Drop; column is 98% null with the only observed value being an empty string."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"Almost certainly a normalised lowercase ingredients-with-allergens text field, but in this sample it carries no signal: 98% of rows are null and the single non-null value is an empty string. 
With cardinality 1 and entropy 0, there is nothing to learn from this column as-is.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_lc","treatment":"Drop from the working set unless a larger sample shows real text content."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a lowercased generic product name field, but it is effectively empty in this sample: 98% null and the only non-null value among 50 rows is an empty string. With cardinality of 1 and entropy of 0, the column carries no information here.","role":"feature","scope":"column","target":"generic_name_lc","treatment":"Drop; no signal at this null rate and cardinality."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column is flagged as unknown kind with all profiling skipped, so saturn produced no statistics beyond a 50-row count and zero nulls. The name suggests it holds debug tags attached to multilingual (xx) ingredient text, likely a list or structured field the profiler could not parse. Without unique counts, value samples, or type information there is nothing further to characterise.","role":"metadata","scope":"column","target":"ingredients_text_xx_debug_tags","treatment":"Inspect raw values manually; drop unless debug tags are needed downstream."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","stats"],"model":"anthropic:claude-opus-4-7","narrative":"This column was skipped by the profiler, so its kind is unknown and no descriptive statistics are available beyond a row count of 50 and a null rate of 0.0. 
The name suggests it holds debug tags attached to localized product names (the 'xx' locale and 'debug_tags' suffix), which is typically engineering scaffolding rather than analytical signal. Without unique counts or value samples, nothing can be said about cardinality or content.","role":"metadata","scope":"column","target":"product_name_xx_debug_tags","treatment":"Drop unless a downstream debugging workflow specifically needs it."},{"confidence":"low","critiques":[],"evidence_keys":["alerts","kind","n","null_rate","column"],"model":"anthropic:claude-opus-4-7","narrative":"This column is flagged as kind 'unknown' and was skipped by the profiler, so no statistics were computed beyond a row count of 50 and a null rate of 0.0. The name suggests it holds debug tags associated with a generic name field, likely diagnostic metadata rather than analytical signal. Without unique counts or value samples, nothing further can be inferred.","role":"metadata","scope":"column","target":"generic_name_xx_debug_tags","treatment":"Drop unless debug tags are explicitly needed for tracing."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language OCR capture of an ingredients list, timestamped in the column name (1561814324). With null_rate of 0.98, only a single non-null row exists out of 50, and that lone value is a full ingredients paragraph\u2014cardinality is 1 and entropy is 0. 
There is effectively no signal here for analysis.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1561814324","treatment":"Drop; 98% null with a single observed value provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR result of a French ingredients label, captured at a specific timestamp (1561814324) suggesting it's one of many time-stamped OCR snapshot columns. Of 50 rows, 98% are null and only a single non-null value exists \u2014 a verbose French ingredients string for a nut-and-raisin mix. With cardinality 1 and entropy 0, the column carries essentially no analytical signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1561814324_result","treatment":"Drop; 98% null and only one distinct OCR string provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold OCR results of French ingredient lists, likely from a timestamped extraction run (1624039072). It is effectively empty: 98% null with only 1 non-null value out of 50, that single entry being a cocoa/soy lecithin/vanilla ingredient string. 
With cardinality 1 and entropy 0, the column carries no usable signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1624039072_result","treatment":"Drop; 98% null with a single observed value provides no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be French OCR-extracted ingredient text from product packaging, with the timestamp suffix suggesting a dated extraction run. Out of 50 rows, 98% are null and only a single non-null value exists ('ingr\u00e9dients : cacao, \u00e9mulsifiant (l\u00e9cithine de _soja_), vanille.'), giving cardinality 1 and zero entropy. The column is effectively empty and carries no discriminative signal.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1624039072","treatment":"Drop; 98% null with a single observed value provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language OCR-extracted ingredients list (likely from a food product label, given mentions of flour, sugar, butter, eggs, and emulsifiers). Out of 50 rows, 98% are null and only a single non-null value exists, giving cardinality 1 and entropy 0. 
The column is effectively empty and carries no discriminative signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573108346","treatment":"Drop; 98% null with a single observed value provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR-extracted French ingredients text from a single product image (timestamped 1566920858), holding raw label transcriptions. The column is effectively empty: 98% null across n=50, with only one non-null value \u2014 a single French ingredient list for a butter/egg pastry product. Cardinality is 1 and entropy is 0, so it carries no discriminative signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1566920858_result","treatment":"Drop; 98% null and only one unique OCR string provides no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This is a French OCR-extracted ingredients list, almost certainly a timestamped snapshot column from an Open Food Facts-style export. The column is effectively empty: 98% null across 50 rows, with only a single non-null value present, so cardinality is 1 and entropy is 0. 
The lone observation is a long free-text French ingredients string, not a category, despite being typed as categorical.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573107556","treatment":"Drop; a single non-null value at 98% null rate carries no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR-extracted French ingredients text from a specific scan run (timestamped 1573108346), holding raw label transcriptions like a bakery product's flour/sugar/butter list. Out of 50 rows, 98% are null and the single populated value is one long French ingredient string, giving cardinality 1 and entropy 0. The column is effectively empty for analytical purposes.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573108346_result","treatment":"Drop; 98% null with only one populated OCR string offers no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold the OCR-extracted French ingredients text from a product image (timestamp 1573107560 in the name suggests a single OCR run). Of 50 rows, 98% are null and only 1 unique value exists \u2014 a single French ingredient list for what looks like a butter/egg pastry. 
With cardinality 1 and entropy 0, this column carries no discriminative signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573107560_result","treatment":"Drop or defer \u2014 98% null and a single observed value provide no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold the OCR-extracted French ingredients text for a product, tied to a specific OCR run timestamp (1573108349). It is essentially empty: 98% null across 50 rows, with only a single non-null value \u2014 a long French ingredients string for what looks like a butter/egg pastry. With cardinality 1 and entropy 0, it carries no discriminative signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573108349_result","treatment":"Drop; 98% null and only one distinct OCR string provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language OCR extraction of a product ingredients list, timestamped 1573108360 in the column name. Out of 50 rows, 98% are null and only a single non-null value exists (a single bakery product's ingredient declaration), giving cardinality 1 and entropy 0. 
The column is effectively empty and carries no discriminative signal.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573108360","treatment":"Drop; 98% null with a single OCR string offers no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to hold the OCR result of a French ingredients list (timestamped 1573109955), capturing the parsed text from a product label. Of 50 rows, 98% are null and only a single non-null value exists \u2014 a long French ingredients string for a butter/egg pastry product. With cardinality 1 and entropy 0, it carries essentially no information at this sample size.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573109955_result","treatment":"Drop; 98% null with a single OCR string offers no modelling signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a French OCR-extracted ingredients list (likely from food packaging), based on the column name and the single observed value containing French ingredient text like 'Farine de bl\u00e9, sucre, beurre frais'. It is almost entirely empty: 98% null across n=50, with only one non-null record and cardinality of 1, giving zero entropy. 
With a single observation it carries no analytical signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573108349","treatment":"Drop; 98% null and only one unique value provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an OCR-extracted French ingredients list (timestamped 1573109955), likely from a product packaging scan. The column is almost entirely empty: 98% null across 50 rows, with only a single non-null value present, giving cardinality 1 and entropy 0. That lone value is a long, noisy free-text string typical of raw OCR output rather than a clean categorical label.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573109955","treatment":"Drop; effectively empty with only one OCR string and no analytical signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR result of a French ingredients label (timestamped 1573107556), capturing extracted text from a product image. Of 50 rows, 98% are null and only a single non-null value exists \u2014 one French ingredient list for a butter/egg/flour pastry. 
With cardinality 1 and entropy 0, the column carries essentially no analytical signal.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573107556_result","treatment":"Drop; 98% null with only one observed OCR string."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR-extracted French ingredients text from a timestamped scan run (1573108360), holding raw label transcriptions. With 98% nulls and only 1 non-null value across 50 rows, it is effectively empty \u2014 the single populated entry is a long French ingredient list for a butter/egg pastry product. Cardinality of 1 and entropy of 0 mean it carries no discriminative signal here.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573108360_result","treatment":"Drop from modelling; if needed, merge with sibling OCR columns into a single ingredients_text field before NLP."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be an OCR-extracted French ingredients list (timestamped 1573107560), capturing the raw text from a product label. Out of 50 rows, 98% are null and only a single non-null value exists, an entry beginning 'Farine de bl\u00e9, sucre, beurre frais 9,5%...'. 
With cardinality 1 and entropy 0, the column carries effectively no signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1573107560","treatment":"Drop; 98% null with a single OCR string offers no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This is a French-language OCR-extracted ingredients list, timestamped in the column name (1566920858), almost certainly from an Open Food Facts-style product dump. Out of 50 rows, 98% are null and only a single non-null value exists, a verbose ingredients string for a butter/egg pastry. With cardinality 1 and entropy 0, the column carries effectively no signal in this sample.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1566920858","treatment":"Drop; 98% null and only one distinct OCR string provides no usable signal."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","n","n_unique"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Lithuanian-locale generic name field, but it is effectively empty: 98% of the 50 rows are null and the single non-null value is the empty string. Cardinality is 1 and entropy is 0, so the column carries no information.","role":"metadata","scope":"column","target":"generic_name_lt","treatment":"Drop; the column is 98% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.cardinality","stats.top_value","stats.top_rate","n"],"model":"anthropic:claude-opus-4-7","narrative":"A Romanian-language ingredients-with-allergens text field, almost entirely empty in this sample. 
98% of rows are null and the only non-null value observed is an empty string, giving a single unique value across n=50.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_ro","treatment":"Drop; effectively no signal at this sample size."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"Lithuanian packaging text field that is effectively empty in this sample: 98% null and the single non-null value is itself an empty string, giving cardinality 1 and zero entropy. There is no usable signal here.","role":"free_text","scope":"column","target":"packaging_text_lt","treatment":"Drop; no observed content."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Lithuanian-language ingredients text field, likely from a multilingual product catalog. It is effectively empty: 98% null across 50 rows, and the single non-null value is itself an empty string, giving cardinality 1 and zero entropy.","role":"free_text","scope":"column","target":"ingredients_text_lt","treatment":"Drop; no usable signal in this sample."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n","n_unique","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"The column 'origin_lt' is nearly entirely null, with a null_rate of 0.98 across 50 rows, leaving only a single non-null observation that is itself an empty string. 
With cardinality of 1, entropy of 0, and top_rate of 1.0, there is no usable signal here.","role":"metadata","scope":"column","target":"origin_lt","treatment":"Drop; effectively empty with no variance."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This column appears to be a Lithuanian-localized product name field, but it is effectively empty: 98% of the 50 rows are null and the single non-null value is itself an empty string. Cardinality is 1 with zero entropy, so it carries no information.","role":"metadata","scope":"column","target":"product_name_lt","treatment":"Drop; the column is 98% null with a single empty-string value."},{"confidence":"high","critiques":[],"evidence_keys":["null_rate","n_unique","stats.entropy","stats.top_value","stats.top_rate","top_values"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a Lithuanian-language ingredients text field with allergen annotations, but it is effectively empty in this sample. 98% of rows are null and the only non-null value observed is the empty string, giving zero entropy across n=50.","role":"free_text","scope":"column","target":"ingredients_text_with_allergens_lt","treatment":"Drop from analysis; insufficient non-null content to model."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.top_rate","stats.top_value"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be a French-language OCR extract of an ingredients list (chocolate product), captured at a specific timestamp suggested by the column suffix. Out of 50 rows, 98% are null and only 1 non-null value exists, making the column effectively a single-record artifact rather than a usable feature. 
The lone value is free-form text describing cacao paste, cocoa butter, sugar, milk powder, and allergen traces.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1713713129","treatment":"Drop; 98% null and only one observed value provides no signal."},{"confidence":"high","critiques":[],"evidence_keys":["n","n_unique","null_rate","stats.cardinality","stats.entropy","stats.top_rate","stats.top_value","alerts"],"model":"anthropic:claude-opus-4-7","narrative":"This appears to be the OCR result of a French ingredients list, captured at a single timestamp (1713713129) and stored as raw text. With null_rate 0.98, only 1 of 50 rows has a value, and that single observation is a chocolate ingredients statement (cocoa paste, cocoa powder, almonds, hazelnuts, soy lecithin). Cardinality is 1 and entropy is 0, so there is no variation to model from this column alone.","role":"free_text","scope":"column","target":"ingredients_text_fr_ocr_1713713129_result","treatment":"Drop; 98% null and only one distinct OCR string provides no 
signal."}],"providers":["anthropic:claude-opus-4-7"],"total_usage":{"completion_tokens":124120,"prompt_tokens":612721,"total_tokens":736841}},"language_counts":{},"meta":{"generated_at":"2026-05-01T18:08:04+00:00","mode":"full","row_count":50,"sampled_rows":50,"seed":42,"source":"/home/coolhand/html/datavis/data_trove/cache/wild/openfoodfacts_sample.json"},"notes":[],"saturn_version":"0.2.0","schema":{"_id":"categorical","_keywords":"unknown","abbreviated_product_name":"categorical","abbreviated_product_name_fr":"categorical","abbreviated_product_name_fr_imported":"categorical","abbreviated_product_name_imported":"categorical","added_countries_tags":"unknown","additives_n":"numeric","additives_original_tags":"unknown","additives_tags":"unknown","allergens":"categorical","allergens_from_ingredients":"categorical","allergens_from_user":"categorical","allergens_hierarchy":"unknown","allergens_imported":"categorical","allergens_lc":"categorical","allergens_tags":"unknown","amino_acids_prev_tags":"unknown","amino_acids_tags":"unknown","brands":"categorical","brands_imported":"categorical","brands_old":"categorical","brands_tags":"unknown","carbon_footprint_from_known_ingredients_debug":"categorical","carbon_footprint_percent_of_known_ingredients":"numeric","categories":"categorical","categories_hierarchy":"unknown","categories_imported":"categorical","categories_lc":"categorical","categories_old":"categorical","categories_properties":"unknown","categories_properties_tags":"unknown","categories_tags":"unknown","category_properties":"unknown","checked":"categorical","checkers":"unknown","checkers_tags":"unknown","ciqual_food_name_tags":"unknown","cities_tags":"unknown","code":"categorical","codes_tags":"unknown","compared_to_category":"categorical","complete":"numeric","completed_t":"numeric","completeness":"numeric","conservation_conditions":"categorical","conservation_conditions_fr":"categorical","conservation_conditions_fr_imported":"categorical","correctors":"unknown",
"correctors_tags":"unknown","countries":"categorical","countries_beforescanbot":"categorical","countries_hierarchy":"unknown","countries_imported":"categorical","countries_lc":"categorical","countries_tags":"unknown","created_t":"numeric","creator":"categorical","customer_service":"categorical","customer_service_fr":"categorical","customer_service_fr_imported":"categorical","data_quality_bugs_tags":"unknown","data_quality_completeness_tags":"unknown","data_quality_dimensions":"unknown","data_quality_errors_tags":"unknown","data_quality_info_tags":"unknown","data_quality_tags":"unknown","data_quality_warnings_tags":"unknown","data_sources":"categorical","data_sources_imported":"categorical","data_sources_tags":"unknown","debug_param_sorted_langs":"unknown","debug_tags":"unknown","ecoscore_data":"unknown","ecoscore_grade":"categorical","ecoscore_score":"numeric","ecoscore_tags":"unknown","editors":"unknown","editors_tags":"unknown","emb_code":"categorical","emb_codes":"categorical","emb_codes_20141016":"categorical","emb_codes_orig":"categorical","emb_codes_tags":"unknown","entry_dates_tags":"unknown","environment_impact_level":"categorical","environment_impact_level_tags":"unknown","expiration_date":"categorical","food_groups":"categorical","food_groups_tags":"unknown","forest_footprint_data":"unknown","fruits-vegetables-nuts_100g_estimate":"numeric","generic_name":"categorical","generic_name_ar":"categorical","generic_name_bg":"categorical","generic_name_ca":"categorical","generic_name_cs":"categorical","generic_name_da":"categorical","generic_name_de":"categorical","generic_name_dz":"categorical","generic_name_el":"categorical","generic_name_en":"categorical","generic_name_es":"categorical","generic_name_et":"categorical","generic_name_fi":"categorical","generic_name_fr":"categorical","generic_name_fr_imported":"categorical","generic_name_he":"categorical","generic_name_hu":"categorical","generic_name_it":"categorical","generic_name_ja":"categorical","generic_name_
lc":"categorical","generic_name_lt":"categorical","generic_name_nb":"categorical","generic_name_nl":"categorical","generic_name_pl":"categorical","generic_name_pt":"categorical","generic_name_ro":"categorical","generic_name_ru":"categorical","generic_name_sk":"categorical","generic_name_sl":"categorical","generic_name_sr":"categorical","generic_name_sv":"categorical","generic_name_th":"categorical","generic_name_uk":"categorical","generic_name_ur":"categorical","generic_name_xx":"categorical","generic_name_xx_debug_tags":"unknown","generic_name_zh":"categorical","generic_name_zh_debug_tags":"unknown","grades":"unknown","id":"categorical","image_front_small_url":"categorical","image_front_thumb_url":"categorical","image_front_url":"categorical","image_small_url":"categorical","image_thumb_url":"categorical","image_url":"categorical","images":"unknown","informers":"unknown","informers_tags":"unknown","ingredients":"unknown","ingredients_analysis":"unknown","ingredients_analysis_tags":"unknown","ingredients_debug":"unknown","ingredients_from_or_that_may_be_from_palm_oil_n":"numeric","ingredients_from_palm_oil_n":"numeric","ingredients_from_palm_oil_tags":"unknown","ingredients_hierarchy":"unknown","ingredients_ids_debug":"unknown","ingredients_lc":"categorical","ingredients_n":"numeric","ingredients_n_tags":"unknown","ingredients_non_nutritive_sweeteners_n":"numeric","ingredients_original_tags":"unknown","ingredients_percent_analysis":"numeric","ingredients_sweeteners_n":"numeric","ingredients_tags":"unknown","ingredients_text":"categorical","ingredients_text_ar":"categorical","ingredients_text_bg":"categorical","ingredients_text_ca":"categorical","ingredients_text_cs":"categorical","ingredients_text_da":"categorical","ingredients_text_de":"categorical","ingredients_text_de_ocr_1548767354":"categorical","ingredients_text_de_ocr_1548767354_result":"categorical","ingredients_text_de_ocr_1559410715":"categorical","ingredients_text_de_ocr_1559410715_result":"categorical","
ingredients_text_de_ocr_1648897071":"categorical","ingredients_text_de_ocr_1648897071_result":"categorical","ingredients_text_de_ocr_1648990410":"categorical","ingredients_text_de_ocr_1648990410_result":"categorical","ingredients_text_debug":"categorical","ingredients_text_debug_tags":"unknown","ingredients_text_dz":"categorical","ingredients_text_el":"categorical","ingredients_text_en":"categorical","ingredients_text_es":"categorical","ingredients_text_es_ocr_1548767061":"categorical","ingredients_text_es_ocr_1548767061_result":"categorical","ingredients_text_et":"categorical","ingredients_text_fi":"categorical","ingredients_text_fr":"categorical","ingredients_text_fr_imported":"categorical","ingredients_text_fr_ocr_1561814324":"categorical","ingredients_text_fr_ocr_1561814324_result":"categorical","ingredients_text_fr_ocr_1566920858":"categorical","ingredients_text_fr_ocr_1566920858_result":"categorical","ingredients_text_fr_ocr_1573107556":"categorical","ingredients_text_fr_ocr_1573107556_result":"categorical","ingredients_text_fr_ocr_1573107560":"categorical","ingredients_text_fr_ocr_1573107560_result":"categorical","ingredients_text_fr_ocr_1573108346":"categorical","ingredients_text_fr_ocr_1573108346_result":"categorical","ingredients_text_fr_ocr_1573108349":"categorical","ingredients_text_fr_ocr_1573108349_result":"categorical","ingredients_text_fr_ocr_1573108360":"categorical","ingredients_text_fr_ocr_1573108360_result":"categorical","ingredients_text_fr_ocr_1573109955":"categorical","ingredients_text_fr_ocr_1573109955_result":"categorical","ingredients_text_fr_ocr_1624039072":"categorical","ingredients_text_fr_ocr_1624039072_result":"categorical","ingredients_text_fr_ocr_1713713129":"categorical","ingredients_text_fr_ocr_1713713129_result":"categorical","ingredients_text_he":"categorical","ingredients_text_hu":"categorical","ingredients_text_hu_ocr_1571428260":"categorical","ingredients_text_hu_ocr_1571428260_result":"categorical","ingredients_text_it":"cate
gorical","ingredients_text_it_ocr_1559410715":"categorical","ingredients_text_it_ocr_1559410715_result":"categorical","ingredients_text_ja":"categorical","ingredients_text_lc":"categorical","ingredients_text_lt":"categorical","ingredients_text_nb":"categorical","ingredients_text_nl":"categorical","ingredients_text_nl_ocr_1675675383":"categorical","ingredients_text_nl_ocr_1675675383_result":"categorical","ingredients_text_pl":"categorical","ingredients_text_pt":"categorical","ingredients_text_ro":"categorical","ingredients_text_ru":"categorical","ingredients_text_sk":"categorical","ingredients_text_sl":"categorical","ingredients_text_sr":"categorical","ingredients_text_sv":"categorical","ingredients_text_th":"categorical","ingredients_text_uk":"categorical","ingredients_text_ur":"categorical","ingredients_text_with_allergens":"categorical","ingredients_text_with_allergens_ar":"categorical","ingredients_text_with_allergens_bg":"categorical","ingredients_text_with_allergens_ca":"categorical","ingredients_text_with_allergens_cs":"categorical","ingredients_text_with_allergens_da":"categorical","ingredients_text_with_allergens_de":"categorical","ingredients_text_with_allergens_el":"categorical","ingredients_text_with_allergens_en":"categorical","ingredients_text_with_allergens_es":"categorical","ingredients_text_with_allergens_et":"categorical","ingredients_text_with_allergens_fi":"categorical","ingredients_text_with_allergens_fr":"categorical","ingredients_text_with_allergens_he":"categorical","ingredients_text_with_allergens_hu":"categorical","ingredients_text_with_allergens_it":"categorical","ingredients_text_with_allergens_ja":"categorical","ingredients_text_with_allergens_lc":"categorical","ingredients_text_with_allergens_lt":"categorical","ingredients_text_with_allergens_nb":"categorical","ingredients_text_with_allergens_nl":"categorical","ingredients_text_with_allergens_pl":"categorical","ingredients_text_with_allergens_pt":"categorical","ingredients_text_with_alle
rgens_ro":"categorical","ingredients_text_with_allergens_ru":"categorical","ingredients_text_with_allergens_sk":"categorical","ingredients_text_with_allergens_sl":"categorical","ingredients_text_with_allergens_sr":"categorical","ingredients_text_with_allergens_sv":"categorical","ingredients_text_with_allergens_th":"categorical","ingredients_text_with_allergens_uk":"categorical","ingredients_text_xx":"categorical","ingredients_text_xx_debug_tags":"unknown","ingredients_text_zh":"categorical","ingredients_text_zh_debug_tags":"unknown","ingredients_that_may_be_from_palm_oil_n":"numeric","ingredients_that_may_be_from_palm_oil_tags":"unknown","ingredients_with_specified_percent_n":"numeric","ingredients_with_specified_percent_sum":"numeric","ingredients_with_unspecified_percent_n":"numeric","ingredients_with_unspecified_percent_sum":"numeric","ingredients_without_ciqual_codes":"unknown","ingredients_without_ciqual_codes_n":"numeric","ingredients_without_ecobalyse_ids":"unknown","ingredients_without_ecobalyse_ids_n":"numeric","interface_version_created":"categorical","interface_version_modified":"categorical","known_ingredients_n":"numeric","labels":"categorical","labels_hierarchy":"unknown","labels_imported":"categorical","labels_lc":"categorical","labels_old":"categorical","labels_tags":"unknown","lang":"categorical","lang_imported":"categorical","languages":"unknown","languages_codes":"unknown","languages_hierarchy":"unknown","languages_tags":"unknown","last_check_dates_tags":"unknown","last_checked_t":"numeric","last_checker":"categorical","last_edit_dates_tags":"unknown","last_editor":"categorical","last_image_dates_tags":"unknown","last_image_t":"numeric","last_modified_by":"categorical","last_modified_t":"numeric","last_updated_t":"numeric","lc":"categorical","lc_imported":"categorical","link":"categorical","main_countries_tags":"unknown","manufacturing_places":"categorical","manufacturing_places_tags":"unknown","max_imgid":"categorical","minerals_prev_tags":"unkno
wn","minerals_tags":"unknown","misc_tags":"unknown","no_nutrition_data":"categorical","no_nutrition_data_imported":"categorical","nova_group":"numeric","nova_group_debug":"categorical","nova_group_error":"categorical","nova_groups":"categorical","nova_groups_markers":"unknown","nova_groups_tags":"unknown","nucleotides_prev_tags":"unknown","nucleotides_tags":"unknown","nutrient_levels":"unknown","nutrient_levels_tags":"unknown","nutriments":"unknown","nutriments_estimated":"unknown","nutriscore":"unknown","nutriscore_2021_tags":"unknown","nutriscore_2023_tags":"unknown","nutriscore_data":"unknown","nutriscore_grade":"categorical","nutriscore_grade_producer":"categorical","nutriscore_grade_producer_imported":"categorical","nutriscore_score":"numeric","nutriscore_score_opposite":"numeric","nutriscore_tags":"unknown","nutriscore_version":"categorical","nutrition_data":"categorical","nutrition_data_per":"categorical","nutrition_data_per_imported":"categorical","nutrition_data_prepared":"categorical","nutrition_data_prepared_per":"categorical","nutrition_data_prepared_per_imported":"categorical","nutrition_grade_fr":"categorical","nutrition_grades":"categorical","nutrition_grades_tags":"unknown","nutrition_score_beverage":"numeric","nutrition_score_debug":"categorical","nutrition_score_warning_fruits_vegetables_legumes_estimate_from_ingredients":"numeric","nutrition_score_warning_fruits_vegetables_legumes_estimate_from_ingredients_value":"numeric","nutrition_score_warning_fruits_vegetables_nuts_estimate_from_ingredients":"numeric","nutrition_score_warning_fruits_vegetables_nuts_estimate_from_ingredients_value":"numeric","nutrition_score_warning_no_fiber":"numeric","nutrition_score_warning_nutriments_estimated":"numeric","obsolete":"categorical","obsolete_imported":"categorical","obsolete_since_date":"categorical","origin":"categorical","origin_ar":"categorical","origin_bg":"categorical","origin_ca":"categorical","origin_cs":"categorical","origin_da":"categorical","origin_
de":"categorical","origin_el":"categorical","origin_en":"categorical","origin_es":"categorical","origin_et":"categorical","origin_fi":"categorical","origin_fr":"categorical","origin_fr_imported":"categorical","origin_he":"categorical","origin_hu":"categorical","origin_it":"categorical","origin_ja":"categorical","origin_lt":"categorical","origin_nb":"categorical","origin_nl":"categorical","origin_pl":"categorical","origin_pt":"categorical","origin_ro":"categorical","origin_ru":"categorical","origin_sk":"categorical","origin_sl":"categorical","origin_sr":"categorical","origin_sv":"categorical","origin_th":"categorical","origin_uk":"categorical","origin_ur":"categorical","origin_xx":"categorical","origins":"categorical","origins_fr":"categorical","origins_hierarchy":"unknown","origins_lc":"categorical","origins_old":"categorical","origins_tags":"unknown","other_nutritional_substances_prev_tags":"unknown","other_nutritional_substances_tags":"unknown","owner":"categorical","owner_fields":"unknown","owner_imported":"categorical","owners_tags":"categorical","packaging":"categorical","packaging_hierarchy":"unknown","packaging_imported":"categorical","packaging_lc":"categorical","packaging_materials_tags":"unknown","packaging_old":"categorical","packaging_old_before_taxonomization":"categorical","packaging_recycling_tags":"unknown","packaging_shapes_tags":"unknown","packaging_tags":"unknown","packaging_text":"categorical","packaging_text_ar":"categorical","packaging_text_bg":"categorical","packaging_text_ca":"categorical","packaging_text_cs":"categorical","packaging_text_da":"categorical","packaging_text_de":"categorical","packaging_text_el":"categorical","packaging_text_en":"categorical","packaging_text_es":"categorical","packaging_text_et":"categorical","packaging_text_fi":"categorical","packaging_text_fr":"categorical","packaging_text_fr_imported":"categorical","packaging_text_he":"categorical","packaging_text_hu":"categorical","packaging_text_it":"categorical","packaging
_text_ja":"categorical","packaging_text_lt":"categorical","packaging_text_nb":"categorical","packaging_text_nl":"categorical","packaging_text_pl":"categorical","packaging_text_pt":"categorical","packaging_text_ro":"categorical","packaging_text_ru":"categorical","packaging_text_sk":"categorical","packaging_text_sl":"categorical","packaging_text_sr":"categorical","packaging_text_sv":"categorical","packaging_text_th":"categorical","packaging_text_uk":"categorical","packaging_text_ur":"categorical","packaging_text_xx":"categorical","packagings":"unknown","packagings_complete":"numeric","packagings_materials":"unknown","packagings_materials_main":"categorical","packagings_n":"numeric","photographers":"unknown","photographers_tags":"unknown","pnns_groups_1":"categorical","pnns_groups_1_tags":"unknown","pnns_groups_2":"categorical","pnns_groups_2_tags":"unknown","popularity_key":"numeric","popularity_tags":"unknown","preparation":"categorical","preparation_fr":"categorical","preparation_fr_imported":"categorical","producer_version_id":"categorical","producer_version_id_imported":"categorical","product":"unknown","product_name":"categorical","product_name_ar":"categorical","product_name_bg":"categorical","product_name_ca":"categorical","product_name_cs":"categorical","product_name_da":"categorical","product_name_de":"categorical","product_name_dz":"categorical","product_name_el":"categorical","product_name_en":"categorical","product_name_es":"categorical","product_name_et":"categorical","product_name_fi":"categorical","product_name_fr":"categorical","product_name_fr_imported":"categorical","product_name_he":"categorical","product_name_hu":"categorical","product_name_it":"categorical","product_name_ja":"categorical","product_name_lc":"categorical","product_name_lt":"categorical","product_name_nb":"categorical","product_name_nl":"categorical","product_name_pl":"categorical","product_name_pt":"categorical","product_name_ro":"categorical","product_name_ru":"categorical","produc
t_name_sk":"categorical","product_name_sl":"categorical","product_name_sr":"categorical","product_name_sv":"categorical","product_name_th":"categorical","product_name_uk":"categorical","product_name_ur":"categorical","product_name_xx":"categorical","product_name_xx_debug_tags":"unknown","product_name_zh":"categorical","product_name_zh_debug_tags":"unknown","product_quantity":"categorical","product_quantity_unit":"categorical","product_type":"categorical","purchase_places":"categorical","purchase_places_tags":"unknown","quantity":"categorical","quantity_imported":"categorical","removed_countries_tags":"unknown","rev":"numeric","scans_n":"numeric","schema_version":"numeric","scores":"unknown","selected_images":"unknown","serving_quantity":"categorical","serving_quantity_unit":"categorical","serving_size":"categorical","serving_size_imported":"categorical","sortkey":"numeric","sources":"unknown","sources_fields":"unknown","specific_ingredients":"unknown","states":"categorical","states_hierarchy":"unknown","states_tags":"unknown","stores":"categorical","stores_tags":"unknown","taxonomies_enhancer_tags":"unknown","teams":"categorical","teams_tags":"unknown","traces":"categorical","traces_from_ingredients":"categorical","traces_from_user":"categorical","traces_hierarchy":"unknown","traces_imported":"categorical","traces_lc":"categorical","traces_tags":"unknown","unique_scans_n":"numeric","unknown_ingredients_n":"numeric","unknown_nutrients_tags":"unknown","update_key":"categorical","url":"categorical","vitamins_prev_tags":"unknown","vitamins_tags":"unknown","weighers_tags":"unknown","weighters_tags":"unknown"}}
