"""Launch a Gradio web UI for the WGNW/Llama-2-ko-7b-Chat-auto-gptq-4bit model."""

import gradio as gr

# `gr.load` builds a ready-made interface from the given repository
# identifier; per the Gradio docs the "models/" prefix selects a model repo
# on the Hugging Face Hub (as opposed to "spaces/").
demo = gr.load("models/WGNW/Llama-2-ko-7b-Chat-auto-gptq-4bit")

# Start the web server at module level, matching the original script's
# behavior of launching as soon as the file is executed.
demo.launch()