Explorar el Código

Enhance schema with extensive vitamins, minerals, and dietary indicators for specialized diets

lanfr144 hace 2 semanas
padre
commit
efd0c0e998
Se han modificado 2 ficheros con 22 adiciones y 3 borrados
  1. +5 -2
      ingest_csv.py
  2. +17 -1
      setup_db.py

+ 5 - 2
ingest_csv.py

@@ -32,8 +32,11 @@ def ingest_file(filename, engine):
 
     required_columns = [
         'code', 'product_name', 'generic_name', 'brands', 'allergens', 'ingredients_text',
-        'proteins_100g', 'fat_100g', 'carbohydrates_100g', 'sugars_100g', 'sodium_100g', 
-        'energy-kcal_100g', 'vitamin-c_100g', 'iron_100g', 'calcium_100g'
+        'proteins_100g', 'fat_100g', 'carbohydrates_100g', 'sugars_100g', 'sodium_100g', 'salt_100g',
+        'energy-kcal_100g', 'vitamin-a_100g', 'vitamin-d_100g', 'vitamin-e_100g', 'vitamin-k_100g',
+        'vitamin-c_100g', 'vitamin-b1_100g', 'vitamin-b2_100g', 'vitamin-pp_100g', 'vitamin-b6_100g',
+        'vitamin-b9_100g', 'vitamin-b12_100g', 'calcium_100g', 'iron_100g', 'magnesium_100g',
+        'zinc_100g', 'potassium_100g', 'cholesterol_100g', 'fiber_100g'
     ]
 
     for chunk in pd.read_csv(filename, sep='\t', dtype=str, chunksize=chunk_size, on_bad_lines='skip', low_memory=False, encoding='utf-8'):

+ 17 - 1
setup_db.py

@@ -144,10 +144,26 @@ def run_db_setup():
         carbohydrates_100g DOUBLE NULL,
         sugars_100g DOUBLE NULL,
         sodium_100g DOUBLE NULL,
+        salt_100g DOUBLE NULL,
         `energy-kcal_100g` DOUBLE NULL,
+        `vitamin-a_100g` DOUBLE NULL,
+        `vitamin-d_100g` DOUBLE NULL,
+        `vitamin-e_100g` DOUBLE NULL,
+        `vitamin-k_100g` DOUBLE NULL,
         `vitamin-c_100g` DOUBLE NULL,
-        iron_100g DOUBLE NULL,
+        `vitamin-b1_100g` DOUBLE NULL,
+        `vitamin-b2_100g` DOUBLE NULL,
+        `vitamin-pp_100g` DOUBLE NULL,
+        `vitamin-b6_100g` DOUBLE NULL,
+        `vitamin-b9_100g` DOUBLE NULL,
+        `vitamin-b12_100g` DOUBLE NULL,
         calcium_100g DOUBLE NULL,
+        iron_100g DOUBLE NULL,
+        magnesium_100g DOUBLE NULL,
+        zinc_100g DOUBLE NULL,
+        potassium_100g DOUBLE NULL,
+        cholesterol_100g DOUBLE NULL,
+        fiber_100g DOUBLE NULL,
         FULLTEXT idx_search (product_name, ingredients_text)
     ) ENGINE=InnoDB;
     """)