# Minimal Gradio launcher: load a hosted model as a demo and serve it.
import gradio as gr

# Build the demo from the "models/ibm-granite/granite-3b-code-base-128k"
# repo, routed through the "hf-inference" provider.
# NOTE(review): the UI components are chosen by gr.load itself, presumably
# from the model's task type -- confirm against the Gradio docs.
demo = gr.load(
    "models/ibm-granite/granite-3b-code-base-128k",
    provider="hf-inference",
)

# Launch at module level (no __main__ guard), exactly as the original
# script did, so running the file starts the app.
demo.launch()