멀티모달 AI 어시스턴트

필요한 모듈 설치하기

!pip install openai
!pip install gradio

멀티모달 AI 템플릿

import gradio as gr

def process_multimodal(text, image, audio):
    """Build a short status report describing which inputs were supplied.

    Args:
        text: Text entered by the user; contributes a line only when it is
            truthy (non-empty), reporting its character count.
        image: Uploaded image, or None when nothing was uploaded.
        audio: Uploaded audio, or None when nothing was uploaded.

    Returns:
        One status line per supplied input (text, image, audio order),
        joined with newlines, or a prompt asking for input when none of
        the three was provided.
    """
    # Each slot holds a status line, or None when that input is absent.
    # The text message is only built when text is truthy, so len() is
    # never called on None.
    text_line = (
        f"📝 Text analysis: {len(text)} characters processed" if text else None
    )
    # Identity checks (not truthiness) so any non-None upload counts.
    image_line = "🖼️ Image uploaded and analyzed" if image is not None else None
    audio_line = "🎵 Audio file processed" if audio is not None else None

    report = [
        line
        for line in (text_line, image_line, audio_line)
        if line is not None
    ]

    if not report:
        return "Please provide some input!"
    return "\n".join(report)

# Look and feel: the Default theme with custom hues, plus a small CSS
# override for the container font and tab-navigation button weight.
_theme = gr.themes.Default(
    primary_hue="blue",
    secondary_hue="gray",
    neutral_hue="slate",
)

_css = """
    .gradio-container {
        font-family: 'Inter', sans-serif;
    }
    .tab-nav button {
        font-weight: 600;
    }
    """

with gr.Blocks(theme=_theme, css=_css) as demo:

    # Page header.
    gr.Markdown(value="""
    # 🤖 Multimodal AI Assistant
    ### Upload text, images, or audio for AI analysis
    """)

    with gr.Row():
        # Left column: the three inputs and the trigger button.
        with gr.Column():
            text_input = gr.Textbox(
                label="💬 Text Input", placeholder="Enter your text here...", lines=4
            )
            image_input = gr.Image(label="📸 Image Upload", type="pil")
            audio_input = gr.Audio(label="🎤 Audio Upload", type="filepath")
            process_btn = gr.Button(value="🚀 Process All", variant="primary", size="lg")

        # Right column: read-only box that shows the report.
        with gr.Column():
            output = gr.Textbox(label="📊 Analysis Results", lines=10, interactive=False)

    # Clicking the button passes the three inputs to process_multimodal
    # and writes its return value to the results box.
    process_btn.click(
        fn=process_multimodal,
        inputs=[text_input, image_input, audio_input],
        outputs=output,
    )

# Launch the interface.
demo.launch()