recetas-saludables-ia2

Sleeping

App Files Files Community

Update app.py

by LauraM655 - opened Dec 11, 2025

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+117

-583

Files changed (1) hide show

app.py +117 -583

app.py CHANGED Viewed

@@ -4,7 +4,6 @@ import pandas as pd
 from sentence_transformers import SentenceTransformer
 from sklearn.metrics.pairwise import cosine_similarity
 import plotly.express as px
-from isodate import parse_duration, ISO8601Error
 import ast
 import numpy as np
 from transformers import pipeline
@@ -17,6 +16,7 @@ from PIL import Image
 import requests
 from io import BytesIO
 import traceback
 warnings.filterwarnings('ignore')
@@ -31,43 +31,15 @@ st.set_page_config(
 # CSS mejorado
 st.markdown("""
 <style>
-    .main {background-color: #f8f9fa;}
-    .stButton>button {
-        background-color: #28a745;
-        color: white;
-        border-radius: 10px;
-        padding: 0.5rem 1rem;
-        font-weight: 600;
-        border: none;
-        transition: all 0.3s;
-    }
-    .stButton>button:hover {
-        background-color: #218838;
-        transform: translateY(-2px);
-        box-shadow: 0 4px 12px rgba(40, 167, 69, 0.2);
-    }
     .recipe-card {
-        background: white;
         border-radius: 10px;
-        padding: 1.5rem;
-        margin: 1rem 0;
-        box-shadow: 0 2px 8px rgba(0,0,0,0.1);
-        border-left: 4px solid #28a745;
     }
-    .highlight {
-        background-color: #e8f5e9;
-        padding: 0.5rem;
-        border-radius: 5px;
-        margin: 0.5rem 0;
-    }
-    .ingredient-item {
-        padding: 0.3rem 0;
-        border-bottom: 1px solid #eee;
-    }
-    .instruction-step {
-        margin: 0.5rem 0;
-        padding-left: 1rem;
-        border-left: 3px solid #28a745;
     }
 </style>
 """, unsafe_allow_html=True)
@@ -75,626 +47,188 @@ st.markdown("""
 # ==================== FUNCIONES AUXILIARES ====================
 def parse_ingredient_string(ing_str):
-    """Parsear cadena de ingredientes del formato R a lista Python"""
     try:
-        if isinstance(ing_str, list):
-            return ing_str
-        if not isinstance(ing_str, str):
-            return []
-        # Limpiar la cadena
-        ing_str = ing_str.strip()
-        # Caso 1: Formato R c("item1", "item2")
-        if ing_str.startswith('c('):
-            # Remover c( y el último paréntesis
-            ing_str = ing_str[2:-1] if ing_str.endswith(')') else ing_str[2:]
-            # Reemplazar comillas dobles escapadas
-            ing_str = ing_str.replace('\\"', '"')
-            # Intentar evaluar como lista Python
-            try:
-                result = ast.literal_eval(ing_str)
-                if isinstance(result, list):
-                    return [str(item).strip('"\'') for item in result]
-                else:
-                    return [str(result).strip('"\'')]
-            except:
-                # Si falla, dividir por comas
-                items = [item.strip().strip('"\'') for item in ing_str.split(',')]
-                return [item for item in items if item and item != 'NA']
-        # Caso 2: Lista JSON-like
-        elif ing_str.startswith('[') and ing_str.endswith(']'):
-            try:
-                result = json.loads(ing_str)
-                if isinstance(result, list):
-                    return [str(item) for item in result]
-            except:
-                pass
-        # Caso 3: Separado por comas simple
-        items = [item.strip().strip('"\'') for item in ing_str.split(',')]
-        items = [item for item in items if item and item not in ['NA', 'character(0)']]
-        return items
-    except Exception as e:
-        st.warning(f"Error al parsear ingredientes: {e}")
         return []
 def parse_instruction_string(instr_str):
-    """Parsear instrucciones del formato R a lista Python"""
     try:
-        if isinstance(instr_str, list):
-            return instr_str
-        if not isinstance(instr_str, str):
-            return []
-        instr_str = instr_str.strip()
-        # Si es una cadena JSON-like o lista Python
-        if (instr_str.startswith('[') and instr_str.endswith(']')):
-            try:
-                result = json.loads(instr_str)
-                if isinstance(result, list):
-                    return [str(item) for item in result]
-            except:
-                pass
-        # Dividir por puntos o números
-        instructions = []
-        # Patrón para dividir por números (1., 2., etc.) o puntos
-        patterns = [r'\d+\.', r'\d+\)', r'Step \d+:', r'\n']
-        for pattern in patterns:
-            if re.search(pattern, instr_str):
-                split_instr = re.split(pattern, instr_str)
-                instructions = [instr.strip() for instr in split_instr if instr.strip()]
-                if len(instructions) > 1:
-                    break
-        # Si no se pudo dividir, usar toda la cadena como una instrucción
-        if not instructions:
-            instructions = [instr_str]
-        return instructions
-    except Exception as e:
-        st.warning(f"Error al parsear instrucciones: {e}")
-        return [str(instr_str)]
-def parse_image_string(img_str):
-    """Parsear URLs de imágenes"""
-    try:
-        if isinstance(img_str, list):
-            return img_str
-        if not isinstance(img_str, str):
-            return []
-        img_str = img_str.strip()
-        # Formato R c("url1", "url2")
-        if img_str.startswith('c('):
-            img_str = img_str[2:-1] if img_str.endswith(')') else img_str[2:]
-            img_str = img_str.replace('\\"', '"')
-            try:
-                result = ast.literal_eval(img_str)
-                if isinstance(result, list):
-                    return [str(item).strip('"\'') for item in result]
-            except:
-                pass
-        # Lista JSON
-        elif img_str.startswith('[') and img_str.endswith(']'):
-            try:
-                result = json.loads(img_str)
-                if isinstance(result, list):
-                    return [str(item) for item in result]
-            except:
-                pass
-        # URL única
-        if img_str.startswith('http'):
-            return [img_str]
-        return []
-    except Exception as e:
         return []
-@st.cache_resource(show_spinner="Cargando modelo de traducción...")
-def load_translator():
-    return pipeline("translation_en_to_es", model="Helsinki-NLP/opus-mt-en-es")
 @st.cache_resource(show_spinner="Cargando modelo de embeddings...")
 def load_embedding_model():
-    return SentenceTransformer('all-MiniLM-L6-v2')
 @lru_cache(maxsize=1000)
-def traducir_texto_cached(texto):
-    """Cachea traducciones para mejorar rendimiento"""
-    if not texto or pd.isna(texto) or str(texto).strip() == '':
-        return ""
     try:
-        texto = str(texto)
-        if len(texto) > 500:
-            texto = texto[:497] + "..."
-        translator = load_translator()
-        return translator(texto, max_length=512)[0]['translation_text']
-    except Exception:
-        return texto
-def load_image_from_url(url, max_size=(400, 300)):
-    """Cargar imagen desde URL con manejo de errores"""
-    try:
-        if not url or not isinstance(url, str) or not url.startswith('http'):
-            return None
-        response = requests.get(url, timeout=5)
-        response.raise_for_status()
-        img = Image.open(BytesIO(response.content))
-        # Convertir a RGB si es necesario
-        if img.mode in ('RGBA', 'LA', 'P'):
-            img = img.convert('RGB')
-        # Redimensionar manteniendo aspecto
-        img.thumbnail(max_size, Image.Resampling.LANCZOS)
-        return img
-    except Exception:
-        return None
 # ==================== CARGA DE DATOS ====================
 @st.cache_data(show_spinner="Cargando y procesando datos de recetas...")
 def load_and_preprocess_data():
-    """Carga y preprocesa los datos con validación robusta"""
     try:
-        # Cargar dataset
-        st.info("Descargando dataset de recetas... Esto puede tomar unos segundos.")
-        ds = load_dataset("AkashPS11/recipes_data_food.com", trust_remote_code=True)
-        df = ds['train'].to_pandas() if 'train' in ds else ds.to_pandas()
-        # Limitar tamaño para mejor rendimiento pero mantener variedad
         df = df.head(8000).copy()
         # Procesar ingredientes
-        df['ingredients_parsed'] = df['RecipeIngredientParts'].apply(parse_ingredient_string)
-        df['ingredients_str'] = df['ingredients_parsed'].apply(
-            lambda x: ' '.join([str(i).lower() for i in x]) if x else ''
-        )
-        # Procesar cantidades
-        df['quantities_parsed'] = df['RecipeIngredientQuantities'].apply(parse_ingredient_string)
         # Procesar instrucciones
-        df['instructions_parsed'] = df['RecipeInstructions'].apply(parse_instruction_string)
-        # Procesar imágenes
-        df['images_parsed'] = df['Images'].apply(parse_image_string)
-        # Filtrar recetas saludables
-        mask = (
-            (df['Calories'] < 800) |
-            df['Keywords'].str.contains('healthy|low fat|vegan|low calorie|vegetarian',
-                                      na=False, case=False, regex=True)
-        )
-        df = df[mask].copy()
-        # Procesar tiempos con manejo de errores
-        def parse_time(time_str):
-            try:
-                if pd.isna(time_str) or not isinstance(time_str, str):
-                    return 0
-                return parse_duration(time_str).total_seconds() / 60
-            except (ISO8601Error, AttributeError, TypeError):
-                return 0
-        df['total_minutes'] = df['TotalTime'].apply(parse_time)
-        df['prep_minutes'] = df['PrepTime'].apply(parse_time)
-        df['cook_minutes'] = df['CookTime'].apply(parse_time)
-        # Limpiar valores NaN
-        numeric_cols = ['Calories', 'FatContent', 'SugarContent', 'ProteinContent', 'AggregatedRating']
-        for col in numeric_cols:
-            if col in df.columns:
-                df[col] = pd.to_numeric(df[col], errors='coerce').fillna(0)
-        # Pre-calcular embeddings para mejor rendimiento
-        st.info("Calculando embeddings para búsqueda rápida...")
         model = load_embedding_model()
-        ingredients_texts = df['ingredients_str'].fillna('').tolist()
-        # Calcular embeddings en lotes para evitar memory error
         batch_size = 100
         embeddings = []
         for i in range(0, len(ingredients_texts), batch_size):
             batch = ingredients_texts[i:i+batch_size]
             batch_embeddings = model.encode(batch, show_progress_bar=False)
             embeddings.extend(batch_embeddings)
-        df['embedding'] = list(embeddings)
-        st.success(f"✅ Dataset cargado: {len(df)} recetas procesadas")
         return df
     except Exception as e:
-        st.error(f"Error crítico al cargar datos: {str(e)}")
-        st.error(traceback.format_exc())
         return pd.DataFrame()
 # ==================== FUNCIONES DE RECOMENDACIÓN ====================
-def recommend_recipes_optimized(user_ingredients, category="", top_k=5, max_cal=500, is_vegan=False, max_time=60):
-    """Función de recomendación optimizada con embeddings pre-calculados"""
     try:
         if df.empty:
             return pd.DataFrame()
-        # Crear embedding de consulta del usuario
         model = load_embedding_model()
-        user_text = ' '.join([str(i).lower() for i in user_ingredients])
         user_embedding = model.encode(user_text)
-        # Calcular similitudes usando embeddings pre-calculados
-        embeddings = np.vstack(df['embedding'].values)
         similarities = cosine_similarity([user_embedding], embeddings)[0]
         df['similarity'] = similarities
-        # Aplicar filtros
-        mask = (
-            (df['Calories'] <= max_cal) &
-            (df['total_minutes'] <= max_time) &
-            (df['similarity'] > 0.1)  # Umbral más bajo para más resultados
-        )
-        if category and category != "":
-            mask &= df['RecipeCategory'].str.contains(category, case=False, na=False)
         if is_vegan:
-            mask &= df['Keywords'].str.contains('vegan', case=False, na=False)
-        filtered = df[mask].copy()
         if filtered.empty:
-            # Relajar filtros si no hay resultados
-            st.warning("No se encontraron recetas con esos filtros estrictos. Mostrando recetas más similares...")
-            filtered = df[df['similarity'] > 0.05].copy()
-        # Ordenar y retornar
-        recs = filtered.nlargest(top_k, ['similarity', 'AggregatedRating'])
         return recs
     except Exception as e:
         st.error(f"Error en recomendación: {str(e)}")
         return pd.DataFrame()
-def get_similar_recipes(recipe_index, top_n=5):
-    """Obtener recetas similares a una receta específica"""
-    try:
-        if df.empty or recipe_index not in df.index:
-            return pd.DataFrame()
-        # Obtener embedding de la receta de referencia
-        target_embedding = df.loc[recipe_index, 'embedding'].reshape(1, -1)
-        # Calcular similitudes con todas las recetas
-        embeddings = np.vstack(df['embedding'].values)
-        similarities = cosine_similarity(target_embedding, embeddings)[0]
-        # Obtener índices de las recetas más similares (excluyendo la receta misma)
-        similar_indices = np.argsort(similarities)[::-1][1:top_n+1]
-        similar_recipes = df.iloc[similar_indices].copy()
-        similar_recipes['similarity_to_recipe'] = similarities[similar_indices]
-        return similar_recipes
-    except Exception as e:
-        st.error(f"Error al buscar recetas similares: {str(e)}")
-        return pd.DataFrame()
 # ==================== INTERFAZ STREAMLIT ====================
-# Título y descripción
-st.title("🍎 Generador Inteligente de Recetas Saludables")
-st.markdown("""
-<div style='background-color: #e8f5e9; padding: 1rem; border-radius: 10px; margin: 1rem 0;'>
-    <h4 style='color: #2e7d32; margin: 0;'>✨ Instrucciones de uso:</h4>
-    <ol style='margin: 0.5rem 0 0 0; color: #555;'>
-        <li>Ingresa los ingredientes que tienes disponibles (separados por comas)</li>
-        <li>Ajusta los filtros según tus preferencias dietéticas</li>
-        <li>Haz clic en "🔍 Buscar Recetas" para obtener recomendaciones personalizadas</li>
-        <li>Explora cada receta haciendo clic en los detalles y busca recetas similares</li>
-    </ol>
-</div>
-""", unsafe_allow_html=True)
-# Cargar datos con spinner
-with st.spinner("Cargando base de datos de recetas..."):
     df = load_and_preprocess_data()
 if df.empty:
-    st.error("No se pudieron cargar los datos. Por favor, recarga la página.")
     st.stop()
-# ==================== BARRA LATERAL ====================
 with st.sidebar:
-    st.header("⚙️ Filtros Avanzados")
-    st.subheader("Preferencias Dietéticas")
-    max_cal = st.slider(
-        "Calorías máximas por porción",
-        100, 1000, 500,
-        help="Limita las recetas por contenido calórico"
-    )
-    max_time = st.slider(
-        "Tiempo máximo de preparación (minutos)",
-        10, 180, 60,
-        help="Incluye tiempo de preparación y cocción"
-    )
-    col1, col2 = st.columns(2)
-    with col1:
-        is_vegan = st.checkbox("🌱 Vegano", help="Solo recetas veganas")
-    with col2:
-        is_healthy = st.checkbox("💚 Saludable", value=True,
-                                help="Priorizar recetas marcadas como saludables")
-    st.subheader("Resultados")
-    top_k = st.select_slider(
-        "Número de recetas a mostrar",
-        options=[3, 5, 7, 10],
-        value=5
-    )
-    similar_recipes_count = st.slider(
-        "Recetas similares a mostrar",
-        2, 8, 3,
-        help="Número de recetas similares para mostrar en cada receta"
-    )
-    st.markdown("---")
-    st.markdown("### 📊 Estadísticas del Dataset")
-    st.metric("Recetas disponibles", len(df))
-    st.metric("Calorías promedio", f"{df['Calories'].mean():.0f}")
-    st.metric("Tiempo promedio", f"{df['total_minutes'].mean():.0f} min")
-# ==================== ENTRADA PRINCIPAL ====================
-st.header("🔍 Buscar Recetas por Ingredientes")
-col1, col2, col3 = st.columns([3, 2, 1])
-with col1:
-    user_input = st.text_input(
-        "Ingredientes disponibles (separados por comas):",
-        "chicken, rice, vegetables",
-        placeholder="Ej: tomate, pollo, arroz, cebolla, aceite de oliva"
-    )
-with col2:
-    # Extraer categorías únicas del dataset
-    unique_categories = [""] + sorted(df['RecipeCategory'].dropna().unique().tolist()[:20])
-    category_input = st.selectbox(
-        "Categoría (opcional):",
-        unique_categories,
-        format_func=lambda x: "Todas las categorías" if x == "" else x[:30]
-    )
-with col3:
-    st.markdown("<br>", unsafe_allow_html=True)
-    search_clicked = st.button("🔍 Buscar Recetas", use_container_width=True)
-# ==================== RESULTADOS ====================
-if search_clicked and user_input:
-    with st.spinner("Buscando recetas que coincidan con tus ingredientes..."):
-        ingredients = [ing.strip() for ing in user_input.split(',') if ing.strip()]
-        if not ingredients:
-            st.warning("Por favor, ingresa al menos un ingrediente.")
-        else:
-            recs = recommend_recipes_optimized(
-                ingredients,
-                category_input,
-                top_k=top_k,
-                max_cal=max_cal,
-                is_vegan=is_vegan,
-                max_time=max_time
-            )
-            st.session_state.recommendations = recs
-            st.session_state.search_made = True
-if 'recommendations' in st.session_state and not st.session_state.recommendations.empty:
-    recs = st.session_state.recommendations
-    st.success(f"✅ Encontradas {len(recs)} recetas que coinciden con tus criterios")
-    # Gráfico de visualización
-    if len(recs) > 1:
-        fig = px.scatter(
-            recs,
-            x='total_minutes',
-            y='Calories',
-            size='similarity',
-            color='RecipeCategory',
-            hover_name='Name',
-            title="📊 Distribución de Recetas Encontradas",
-            labels={
-                'total_minutes': 'Tiempo Total (minutos)',
-                'Calories': 'Calorías',
-                'RecipeCategory': 'Categoría'
-            }
-        )
-        fig.update_layout(
-            paper_bgcolor='rgba(0,0,0,0)',
-            plot_bgcolor='rgba(0,0,0,0)',
-            font_color='#333'
-        )
-        st.plotly_chart(fig, use_container_width=True)
-    # Mostrar recetas
-    st.header("🍽️ Recetas Recomendadas")
-    for idx, row in recs.iterrows():
-        recipe_index = row.name  # Índice en el DataFrame original
-        with st.container():
-            st.markdown(f"<div class='recipe-card'>", unsafe_allow_html=True)
-            # Título traducido
-            recipe_name = traducir_texto_cached(row['Name'])
-            st.markdown(f"### {recipe_name}")
-            # Metadatos en columnas
-            col_meta1, col_meta2, col_meta3, col_meta4 = st.columns(4)
-            with col_meta1:
-                st.metric("🔥 Calorías", f"{row['Calories']:.0f}")
-            with col_meta2:
-                st.metric("⏱️ Tiempo", f"{row['total_minutes']:.0f} min")
-            with col_meta3:
-                st.metric("⭐ Similitud", f"{row['similarity']:.3f}")
-            with col_meta4:
-                if 'AggregatedRating' in row and row['AggregatedRating'] > 0:
-                    st.metric("★ Valoración", f"{row['AggregatedRating']:.1f}/5")
-                else:
-                    st.metric("★ Valoración", "N/A")
-            # Contenedor principal con columnas para imagen y contenido
-            col_img, col_content = st.columns([1, 2])
-            with col_img:
-                # Mostrar imagen si está disponible
-                try:
-                    images = row['images_parsed'] if 'images_parsed' in row else []
-                    if images and len(images) > 0:
-                        img_url = images[0]
-                        img = load_image_from_url(img_url)
-                        if img:
-                            st.image(img, caption="Imagen de referencia", use_column_width=True)
-                        else:
-                            # Mostrar placeholder si no se puede cargar la imagen
-                            st.image("https://images.unsplash.com/photo-1490818387583-1baba5e638af?w=400&h=300&fit=crop",
-                                    caption="Imagen representativa", use_column_width=True)
-                    else:
-                        st.image("https://images.unsplash.com/photo-1490818387583-1baba5e638af?w-400&h=300&fit=crop",
-                                caption="Imagen representativa", use_column_width=True)
-                except Exception:
-                    st.image("https://images.unsplash.com/photo-1490818387583-1baba5e638af?w=400&h=300&fit=crop",
-                            caption="Imagen representativa", use_column_width=True)
-            with col_content:
-                # Descripción
-                if pd.notna(row.get('Description')) and str(row['Description']).strip():
-                    with st.expander("📝 Descripción", expanded=False):
-                        desc = traducir_texto_cached(row['Description'])
-                        st.write(desc)
-                # Ingredientes con cantidades
-                with st.expander("🛒 Ingredientes", expanded=False):
-                    try:
-                        ingredients_list = row['ingredients_parsed'] if 'ingredients_parsed' in row else []
-                        quantities_list = row['quantities_parsed'] if 'quantities_parsed' in row else []
-                        if ingredients_list and len(ingredients_list) > 0:
-                            # Mostrar ingredientes con cantidades si están disponibles
-                            if quantities_list and len(quantities_list) == len(ingredients_list):
-                                for qty, ing in zip(quantities_list, ingredients_list):
-                                    ing_translated = traducir_texto_cached(ing)
-                                    st.markdown(f"""
-                                    <div class='ingredient-item'>
-                                        <strong>{qty}</strong> - {ing_translated}
-                                    </div>
-                                    """, unsafe_allow_html=True)
-                            else:
-                                # Mostrar solo ingredientes
-                                for ing in ingredients_list:
-                                    ing_translated = traducir_texto_cached(ing)
-                                    st.markdown(f"""
-                                    <div class='ingredient-item'>
-                                        • {ing_translated}
-                                    </div>
-                                    """, unsafe_allow_html=True)
-                        else:
-                            st.info("No hay información de ingredientes disponible para esta receta.")
-                    except Exception as e:
-                        st.error(f"Error al mostrar ingredientes: {e}")
-                # Instrucciones
-                with st.expander("👩‍🍳 Instrucciones de Preparación", expanded=False):
-                    try:
-                        instructions = row['instructions_parsed'] if 'instructions_parsed' in row else []
-                        if instructions and len(instructions) > 0:
-                            for i, step in enumerate(instructions, 1):
-                                step_translated = traducir_texto_cached(step)
-                                st.markdown(f"""
-                                <div class='instruction-step'>
-                                    <strong>Paso {i}:</strong> {step_translated}
-                                </div>
-                                """, unsafe_allow_html=True)
-                        else:
-                            st.info("No hay instrucciones disponibles para esta receta.")
-                    except Exception as e:
-                        st.error(f"Error al mostrar instrucciones: {e}")
-                # Información nutricional
-                with st.expander("📊 Información Nutricional", expanded=False):
-                    nutri_data = {
-                        'Nutriente': ['Calorías', 'Grasa Total', 'Azúcares', 'Proteína'],
-                        'Cantidad': [
-                            f"{row.get('Calories', 0):.0f} kcal",
-                            f"{row.get('FatContent', 0):.1f} g" if pd.notna(row.get('FatContent')) else "N/A",
-                            f"{row.get('SugarContent', 0):.1f} g" if pd.notna(row.get('SugarContent')) else "N/A",
-                            f"{row.get('ProteinContent', 0):.1f} g" if pd.notna(row.get('ProteinContent')) else "N/A"
-                        ]
-                    }
-                    st.table(pd.DataFrame(nutri_data))
-            # Recetas similares
-            with st.expander(f"🔍 Ver {similar_recipes_count} recetas similares", expanded=False):
-                similar_recipes = get_similar_recipes(recipe_index, top_n=similar_recipes_count)
-                if not similar_recipes.empty:
-                    for sim_idx, sim_row in similar_recipes.iterrows():
-                        col_sim1, col_sim2 = st.columns([3, 1])
-                        with col_sim1:
-                            sim_name = traducir_texto_cached(sim_row['Name'])
-                            st.markdown(f"**{sim_name}**")
-                            st.caption(f"Calorías: {sim_row['Calories']:.0f} kcal • Tiempo: {sim_row['total_minutes']:.0f} min")
-                        with col_sim2:
-                            st.metric("Similitud", f"{sim_row['similarity_to_recipe']:.3f}")
-                        st.markdown("---")
-                else:
-                    st.info("No se encontraron recetas similares.")
-            st.markdown("</div>", unsafe_allow_html=True)
-            st.markdown("<br>", unsafe_allow_html=True)
-# ==================== INICIO CON RECETAS DE EJEMPLO ====================
-elif 'recommendations' not in st.session_state:
-    st.info("👈 Ingresa ingredientes y ajusta los filtros para comenzar, o usa nuestro ejemplo:")
-    # Mostrar algunas recetas de ejemplo al inicio
-    example_ingredients = ["chicken", "rice", "vegetables"]
-    if st.button("🍗 Usar ejemplo: Pollo con arroz y vegetales"):
-        with st.spinner("Buscando recetas de ejemplo..."):
-            example_recs = recommend_recipes_optimized(
-                example_ingredients,
-                top_k=3,
-                max_cal=600,
-                max_time=90
-            )
-            st.session_state.recommendations = example_recs
-            st.rerun()
-# ==================== PIE DE PÁGINA ====================
-st.markdown("---")
-st.markdown("""
-<div style='text-align: center; color: #666; padding: 1rem;'>
-    <p>🍎 <strong>Generador de Recetas Saludables con IA</strong> •
-    Usa modelos de machine learning para encontrar recetas perfectas basadas en tus ingredientes</p>
-    <p style='font-size: 0.9rem;'>Powered by Hugging Face 🤗 • Sentence Transformers • Streamlit</p>
-</div>
-""", unsafe_allow_html=True)

 from sentence_transformers import SentenceTransformer
 from sklearn.metrics.pairwise import cosine_similarity
 import plotly.express as px
 import ast
 import numpy as np
 from transformers import pipeline
 import requests
 from io import BytesIO
 import traceback
+import datetime
 warnings.filterwarnings('ignore')
 # CSS mejorado
 st.markdown("""
 <style>
     .recipe-card {
+        background-color: #f8f9fa;
+        padding: 20px;
         border-radius: 10px;
+        box-shadow: 0 2px 4px rgba(0,0,0,0.1);
+        margin-bottom: 20px;
     }
+    .stButton > button {
+        width: 100%;
     }
 </style>
 """, unsafe_allow_html=True)
 # ==================== FUNCIONES AUXILIARES ====================
 def parse_ingredient_string(ing_str):
+    """Split a comma-separated ingredient string into a list of names.
+
+    Each piece is stripped of surrounding whitespace and blank pieces are
+    dropped. Any value that is not a ``str`` produces an empty list.
+    """
+    if not isinstance(ing_str, str):
+        return []
+    trimmed = (piece.strip() for piece in ing_str.split(','))
+    return [piece for piece in trimmed if piece]
 def parse_instruction_string(instr_str):
+    """Split a block of recipe instructions into individual steps.
+
+    Steps are separated at newlines and at periods. A period that is
+    immediately followed by a digit is treated as a decimal point and kept,
+    so quantities such as "1.5 litros" stay inside one step.
+
+    Args:
+        instr_str: The raw instruction text.
+
+    Returns:
+        A list of non-empty, whitespace-stripped steps. Any value that is
+        not a ``str`` produces an empty list.
+    """
+    if not isinstance(instr_str, str):
+        return []
+    # (?!\d) keeps "1.5" intact; the previous pattern split on every period.
+    pieces = re.split(r'\.(?!\d)\s*|\n\s*', instr_str)
+    stripped = (piece.strip() for piece in pieces)
+    return [piece for piece in stripped if piece]
 @st.cache_resource(show_spinner="Cargando modelo de embeddings...")
 def load_embedding_model():
+    """Return the SentenceTransformer used to embed ingredient text.
+
+    Wrapped in ``st.cache_resource``, with a spinner message shown while
+    the model loads.
+    """
+    return SentenceTransformer('paraphrase-multilingual-MiniLM-L12-v2')  # Multilingual for Spanish support
+@st.cache_resource(show_spinner="Cargando modelo para chatbot...")
+def load_chat_model():
+    """Return the text-generation pipeline used by the advice chatbot.
+
+    Wrapped in ``st.cache_resource``, with a spinner message shown while
+    the pipeline loads.
+    """
+    return pipeline("text-generation", model="flax-community/gpt-2-spanish")  # Spanish-capable model for advice
 @lru_cache(maxsize=1000)
+def get_chat_response(query, context=""):
+    """Generate a chatbot reply to ``query``, optionally grounded in a recipe.
+
+    Args:
+        query: The user's question.
+        context: Recipe text to include in the prompt. Only the first 500
+            characters are used; a value that is not a ``str`` (for example
+            a missing DataFrame cell) is treated as no context.
+
+    Returns:
+        The text after the last "Asistente: " marker in the generated
+        output, stripped of surrounding whitespace. Results are memoised
+        per ``(query, context)`` pair by ``lru_cache``.
+    """
+    # Slicing a non-string (e.g. NaN) would raise TypeError.
+    context_text = context[:500] if isinstance(context, str) else ""
+    model = load_chat_model()
+    prompt = f"Usuario: {query}\nContexto de receta: {context_text}\nAsistente: "
+    # max_new_tokens bounds only the generated continuation. max_length also
+    # counts the prompt, which here can already be longer than 150 tokens.
+    outputs = model(prompt, max_new_tokens=150, num_return_sequences=1)
+    response = outputs[0]['generated_text']
+    return response.split("Asistente: ")[-1].strip()
+def parse_duration_to_minutes(dur_str):
+    """Convert an ``HH:MM`` or ``HH:MM:SS`` duration string to whole minutes.
+
+    Args:
+        dur_str: The duration text. Seconds, when present, are truncated to
+            whole minutes.
+
+    Returns:
+        The duration in minutes as an ``int``. Returns 0 when the value is
+        not a string, contains no ":", has a non-integer field, or has a
+        number of fields other than two or three.
+    """
+    if not isinstance(dur_str, str) or ':' not in dur_str:
+        return 0
+    try:
+        fields = [int(field) for field in dur_str.split(':')]
+    except ValueError:
+        # Only a malformed number is expected here; anything else should surface.
+        return 0
+    if len(fields) == 2:
+        hours, minutes = fields
+        seconds = 0
+    elif len(fields) == 3:
+        hours, minutes, seconds = fields
+    else:
+        return 0
+    return hours * 60 + minutes + seconds // 60
 # ==================== CARGA DE DATOS ====================
 @st.cache_data(show_spinner="Cargando y procesando datos de recetas...")
 def load_and_preprocess_data():
+    """Load the Spanish recipe dataset and derive the columns used for search.
+
+    Takes the first 8000 rows of the ``train`` split of
+    ``somosnlp/RecetasDeLaAbuela`` and adds the ``ingredients_parsed``,
+    ``ingredients_str``, ``instructions_parsed``, ``total_minutes``,
+    ``is_healthy`` and ``embedding`` columns.
+
+    Returns:
+        The processed DataFrame, or an empty DataFrame if any step raises
+        (the error message is shown with ``st.error``).
+    """
     try:
+        st.info("Descargando dataset de recetas españolas... Esto puede tomar unos segundos.")
+        ds = load_dataset("somosnlp/RecetasDeLaAbuela")
+        df = ds['train'].to_pandas()
+        # Cap the row count for performance
         df = df.head(8000).copy()
+        # Parse ingredients into a list and into one lowercase search string
+        df['ingredients_parsed'] = df['Ingredientes'].apply(parse_ingredient_string)
+        df['ingredients_str'] = df['ingredients_parsed'].apply(lambda x: ' '.join(x).lower())
+        # Parse instructions into steps
+        df['instructions_parsed'] = df['Pasos'].apply(parse_instruction_string)
+        # Convert the duration text to minutes
+        df['total_minutes'] = df['Duracion'].apply(parse_duration_to_minutes)
+        # Flag recipes as healthy when the nutrition text matches one of these
+        # phrases (low calorie, low fat, vegetarian, vegan)
+        df['is_healthy'] = df['Valor nutricional'].str.contains('Bajo en calorías|Bajo en grasas|vegetarianos|vegano', na=False, case=False)
+        # Pre-compute one embedding per recipe from its ingredient string
+        st.info("Calculando embeddings multilingües para búsqueda rápida...")
         model = load_embedding_model()
+        ingredients_texts = df['ingredients_str'].tolist()
+        # Encode in batches of 100 texts
         batch_size = 100
         embeddings = []
         for i in range(0, len(ingredients_texts), batch_size):
             batch = ingredients_texts[i:i+batch_size]
             batch_embeddings = model.encode(batch, show_progress_bar=False)
             embeddings.extend(batch_embeddings)
+        df['embedding'] = embeddings
+        st.success(f"Dataset cargado: {len(df)} recetas procesadas")
         return df
     except Exception as e:
+        # NOTE(review): this function is wrapped in st.cache_data, so the empty
+        # DataFrame returned here is presumably cached like any other result;
+        # confirm whether a transient download failure should be cached.
+        st.error(f"Error al cargar datos: {str(e)}")
         return pd.DataFrame()
 # ==================== FUNCIONES DE RECOMENDACIÓN ====================
+def recommend_recipes_optimized(user_ingredients, category="", top_k=5, is_healthy=True, is_vegan=False, max_time=60):
+    """Rank recipes by embedding similarity to the user's ingredients.
+
+    Args:
+        user_ingredients: Iterable of ingredient strings; they are joined
+            with spaces and lowercased to form the query text.
+        category: Optional text that must appear (case-insensitively, as a
+            literal substring) in the recipe's ``Categoria``.
+        top_k: Maximum number of recipes to return.
+        is_healthy: Keep only rows whose ``is_healthy`` flag is set.
+        is_vegan: Keep only rows whose ``Valor nutricional`` mentions
+            "vegano" or "vegetarianos".
+        max_time: Upper bound on ``total_minutes``.
+
+    Returns:
+        Up to ``top_k`` rows with an added ``similarity`` column, highest
+        similarity first. If no row passes the filters, every filter is
+        dropped and rows with similarity above 0.05 are ranked instead. An
+        empty DataFrame is returned when ``df`` is empty or on any error
+        (which is shown with ``st.error``).
+    """
     try:
         if df.empty:
             return pd.DataFrame()
         model = load_embedding_model()
+        user_text = ' '.join(user_ingredients).lower()
         user_embedding = model.encode(user_text)
+        embeddings = np.vstack(df['embedding'])
         similarities = cosine_similarity([user_embedding], embeddings)[0]
+        # Score a copy so a search does not write into the module-level ``df``.
+        scored = df.copy()
+        scored['similarity'] = similarities
+        mask = (scored['similarity'] > 0.1) & (scored['total_minutes'] <= max_time)
+        if category:
+            # regex=False: ``category`` is free text typed by the user, and a
+            # character such as "(" would otherwise raise a regex error.
+            mask &= scored['Categoria'].str.contains(category, case=False, na=False, regex=False)
+        if is_healthy:
+            mask &= scored['is_healthy']
         if is_vegan:
+            mask &= scored['Valor nutricional'].str.contains('vegano|vegetarianos', case=False, na=False)
+        filtered = scored[mask]
         if filtered.empty:
+            st.warning("Relajando filtros...")
+            filtered = scored[scored['similarity'] > 0.05]
+        recs = filtered.nlargest(top_k, 'similarity')
         return recs
     except Exception as e:
         st.error(f"Error en recomendación: {str(e)}")
         return pd.DataFrame()
 # ==================== INTERFAZ STREAMLIT ====================
+# Page title, then load the processed recipe table; the app stops here when
+# loading returned an empty DataFrame.
+st.title("Generador Inteligente de Recetas Saludables")
+with st.spinner("Cargando base de datos..."):
     df = load_and_preprocess_data()
 if df.empty:
     st.stop()
+# Sidebar: search filters
 with st.sidebar:
+    st.header("Filtros")
+    max_time = st.slider("Tiempo máximo (minutos)", 10, 120, 60)
+    is_healthy = st.checkbox("Solo recetas saludables", value=True)
+    is_vegan = st.checkbox("Vegano", value=False)
+    category = st.text_input("Categoría (ej. postres)")
+# User input: comma-separated ingredients, stripped, lowercased, blanks dropped
+user_input = st.text_input("Ingresa ingredientes (separados por comas, en español):", "tomate, cebolla, pollo")
+user_ingredients = [i.strip().lower() for i in user_input.split(',') if i.strip()]
+# Run the search on click and render one section per recommended recipe.
+if st.button("Buscar Recetas"):
+    recs = recommend_recipes_optimized(user_ingredients, category, 5, is_healthy, is_vegan, max_time)
+    if recs.empty:
+        # Without this branch an empty result renders nothing at all, which
+        # looks as if the button did not respond.
+        st.info("No se encontraron recetas para esos ingredientes y filtros.")
+    else:
+        for idx, row in recs.iterrows():
+            with st.container():
+                st.markdown(f"### {row['Nombre']}")
+                st.write(f"**Tiempo:** {row['Duracion']} | **Porciones:** {row.get('Comensales', 'N/A')} | **Nutrición:** {row['Valor nutricional']}")
+                # Ingredient table
+                ing_df = pd.DataFrame(row['ingredients_parsed'], columns=["Ingrediente"])
+                st.table(ing_df)
+                # One expander per instruction step
+                for i, step in enumerate(row['instructions_parsed'], 1):
+                    with st.expander(f"Paso {i}"):
+                        st.write(step)
+                # Single-bar chart of the recipe's total time.
+                # NOTE(review): recipes with the same total_minutes produce
+                # identical figures; confirm the installed Streamlit accepts
+                # repeated identical charts without an explicit key.
+                fig = px.bar(x=['Tiempo Total'], y=[row['total_minutes']])
+                st.plotly_chart(fig, use_container_width=True)
+# Chatbot section: answer a free-text question, using the steps of the recipe
+# most similar to the current ingredient list as context.
+st.header("Chatbot de Consejos")
+chat_input = st.chat_input("Pregunta sobre una receta o modificaciones:")
+if chat_input:
+    with st.chat_message("user"):
+        st.markdown(chat_input)
+    # Reuse the cleaned ingredient list instead of re-splitting the raw text,
+    # which would keep stray whitespace and empty entries.
+    similar_recs = recommend_recipes_optimized(user_ingredients, top_k=1)
+    context = similar_recs['Pasos'].iloc[0] if not similar_recs.empty else ""
+    # A missing 'Pasos' cell is not a string; fall back to no context.
+    if not isinstance(context, str):
+        context = ""
+    response = get_chat_response(chat_input, context)
+    with st.chat_message("assistant"):
+        st.markdown(response)