"""Minimal Gradio app that serves a demo UI for a hosted Llama 3.2 model."""

import gradio as gr

# Build the interface from the model identifier. The "models/" prefix is the
# Gradio convention for loading a model hosted on the Hugging Face Hub.
# NOTE(review): confirm this checkpoint is actually served by the backend
# gr.load() uses; that cannot be verified from this file alone.
demo = gr.load("models/mlx-community/Llama-3.2-1B-Instruct-4bit")

# Start the web server for the interface (runs on execution, as before).
demo.launch()