엄한솔
01/16/2023, 7:46 AM
@bentoml.Runnable.method(batchable=True)
def infer_batch(self, data):
    """Run inference on the ``image_url`` value of every row in ``data``.

    Args:
        data: Tabular batch exposing ``to_dict(orient="records")``
            (presumably a pandas DataFrame -- confirm against the caller).
            Records without an ``image_url`` key contribute ``None``.

    Returns:
        Whatever ``inference_urls`` returns for the collected URLs.
    """
    records = data.to_dict(orient="records")
    image_urls = [record.get("image_url") for record in records]
    # The original passed an undefined name (`urls`) here and left the list
    # it had just built unused; pass the collected URLs instead.
    # NOTE(review): `model` is not defined in this method, so it is looked up
    # in an enclosing scope -- confirm it should not be an attribute on self.
    return inference_urls(model, image_urls)
# Runner that wraps ShotRunnable; `domain` is forwarded to the runnable's
# constructor through `runnable_init_params`.
shot_runner = bentoml.Runner(
    ShotRunnable,
    runnable_init_params={"domain": domain},
    # Plain literal: the original f-string had no placeholders.
    name="Runner",
    # Batching limits handed to the runner: at most 32 inputs per batch and
    # a 10000 ms latency ceiling.
    max_batch_size=32,
    max_latency_ms=10000,
)