"""Minimal Gradio front end for a (placeholder) llama.cpp text demo."""

import gradio as gr


def greet(input_text: str) -> str:
    """Return the placeholder response shown for *input_text*.

    No model is invoked yet; the text is only echoed back inside a fixed
    message.

    Args:
        input_text: Text entered by the user in the web UI.

    Returns:
        The string ``"Llama.cpp would process: <input_text>"``.
    """
    # Example call to a compiled llama.cpp binary (replace with real model
    # path). NOTE: enabling it also requires `import subprocess`, which this
    # file does not currently import.
    # subprocess.run(["./llama.cpp/main", "-m", "models/llama-7b.gguf", "-p", input_text])
    return f"Llama.cpp would process: {input_text}"


def run(server_name: str = "0.0.0.0", server_port: int = 7860) -> None:
    """Build the Gradio interface around :func:`greet` and launch it.

    Args:
        server_name: Host/interface passed to ``demo.launch``. The default
            ``"0.0.0.0"`` listens on all network interfaces, so the UI is
            reachable from other machines; pass ``"127.0.0.1"`` to keep it
            local-only.
        server_port: TCP port passed to ``demo.launch``.
    """
    demo = gr.Interface(
        fn=greet,
        inputs=gr.Textbox(label="Enter text"),
        outputs="text",
        title="Llama.cpp + Gradio Demo",
    )
    demo.launch(server_name=server_name, server_port=server_port)


if __name__ == "__main__":
    run()