"""Launch a Gradio demo for the upstage/Llama-2-70b-instruct model."""

import gradio

# Build the demo from the given model identifier. The "models/" prefix is
# presumably Gradio's convention for a Hugging Face Hub model -- see the
# `gradio.load` documentation to confirm for the installed version.
demo = gradio.load("models/upstage/Llama-2-70b-instruct")

# Enable request queuing with the queue size capped at 3 (`max_size=3`).
demo = demo.queue(max_size=3)

# Start the app with debug mode enabled.
demo.launch(debug=True)