diff --git a/docs/how_to/tutorials/e2e_opt_model.py b/docs/how_to/tutorials/e2e_opt_model.py index 9f89e744a362..8307ddc4f299 100644 --- a/docs/how_to/tutorials/e2e_opt_model.py +++ b/docs/how_to/tutorials/e2e_opt_model.py @@ -113,12 +113,14 @@ # We skip this step in the CI environment. if not IS_IN_CI: - ex = tvm.compile(mod, target="cuda") + with target: + mod = tvm.tir.transform.DefaultGPUSchedule()(mod) + ex = tvm.compile(mod, target=target) dev = tvm.device("cuda", 0) vm = relax.VirtualMachine(ex, dev) # Need to allocate data and params on GPU device gpu_data = tvm.runtime.tensor(np.random.rand(1, 3, 224, 224).astype("float32"), dev) gpu_params = [tvm.runtime.tensor(p, dev) for p in params["main"]] - gpu_out = vm["main"](gpu_data, *gpu_params).numpy() + gpu_out = vm["main"](gpu_data, *gpu_params)[0].numpy() print(gpu_out.shape)