""" Call the deployed ZeroGPU Space API from localhost. pip install gradio_client export HF_TOKEN=hf_xxx # your Pro token -> uses YOUR ZeroGPU quota python space_client.py """ import os from gradio_client import Client, handle_file SPACE = os.environ.get("SPACE_ID", "chabab/qwen-agentworld-35b-zerogpu") # Passing hf_token charges the call to your account's ZeroGPU quota (recommended; # anonymous calls share a much smaller pool and may be rejected). client = Client(SPACE, token=os.environ.get("HF_TOKEN")) # --- text only ------------------------------------------------------------- result = client.predict( message={"text": "Give me a one-sentence hello.", "files": []}, max_new_tokens=256, temperature=0.7, api_name="/chat", ) print("TEXT ->", result) # --- image + text ---------------------------------------------------------- # result = client.predict( # message={ # "text": "Describe this image.", # "files": [handle_file("https://gradio-builds.s3.amazonaws.com/demo-files/cheetah.jpg")], # }, # max_new_tokens=256, # temperature=0.7, # api_name="/chat", # ) # print("VISION ->", result)