subprocess.CalledProcessError: Command '['H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\tcc\tcc.exe', 'C:\Users\Administrator\AppData\Local\Temp\tmp7d7gbzqe\cuda_utils.c', '-O3', '-shared', '-Wno-psabi', '-o', 'C:\Users\Administrator\AppData\Local\Temp\tmp7d7gbzqe\cuda_utils.cp312-win_amd64.pyd', '-fPIC', '-D_Py_USE_GCC_BUILTIN_ATOMICS', '-lcuda', '-lpython312', '-LH:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\lib', '-LC:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v12.8\lib\x64', '-IH:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\include', '-IC:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v12.8\include', '-IC:\Users\Administrator\AppData\Local\Temp\tmp7d7gbzqe', '-IH:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Include']' returned non-zero exit status 1.
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 534, in execute
output_data, output_ui, has_subgraph, has_pending_tasks = await get_output_data(prompt_id, unique_id, obj, input_data_all, execution_block_cb=execution_block_cb, pre_execute_cb=pre_execute_cb, v3_data=v3_data)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 334, in get_output_data
return_values = await _async_map_node_over_list(prompt_id, unique_id, obj, input_data_all, obj.FUNCTION, allow_interrupt=True, execution_block_cb=execution_block_cb, pre_execute_cb=pre_execute_cb, v3_data=v3_data)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\comfyui-lora-manager\py\metadata_collector\metadata_hook.py", line 171, in async_map_node_over_list_with_metadata
results = await original_map_node_over_list(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 308, in _async_map_node_over_list
await process_inputs(input_dict, i)
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 296, in process_inputs
result = f(**inputs)
^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\nodes.py", line 4233, in process
mesh = pipeline.decode_latent(shape_slat, texture_slat, resolution, use_tiled=use_tiled_decoder)[0]
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\utils\_contextlib.py", line 120, in decorate_context
return func(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\pipelines\trellis2_image_to_3d.py", line 1036, in decode_latent
meshes, subs = self.decode_shape_slat(shape_slat, resolution, use_tiled=use_tiled)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\pipelines\trellis2_image_to_3d.py", line 916, in decode_shape_slat
ret = self.models['shape_slat_decoder'](slat, return_subs=True, useTiled=use_tiled)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1773, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1784, in _call_impl
return forward_call(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\fdg_vae.py", line 94, in forward
decoded = super().forward(x, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\sparse_unet_vae.py", line 681, in forward
h = block(h)
^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1773, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1784, in _call_impl
return forward_call(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\sparse_unet_vae.py", line 408, in forward
return self._forward(x)
^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\sparse_unet_vae.py", line 395, in _forward
h = self.conv(x)
^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1773, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1784, in _call_impl
return forward_call(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\modules\sparse\conv\conv.py", line 19, in forward
return _backends[config.CONV].sparse_conv3d_forward(self, x)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\modules\sparse\conv\conv_flex_gemm.py", line 46, in sparse_conv3d_forward
out, neighbor_cache_ = sparse_submanifold_conv3d(
^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\ops\spconv\submanifold_conv3d.py", line 372, in sparse_submanifold_conv3d
return SubMConv3dFunction.apply(feats, coords, shape, neighbor_cache, weight, bias, dilation)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\autograd\function.py", line 576, in apply
return super().apply(*args, **kwargs) # type: ignore[misc]
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\ops\spconv\submanifold_conv3d.py", line 321, in forward
output = SubMConv3dFunction._sparse_submanifold_conv_forward(feats, neighbor_cache, weight, bias)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\ops\spconv\submanifold_conv3d.py", line 166, in _sparse_submanifold_conv_forward
output = kernels.triton.sparse_submanifold_conv_fwd_implicit_gemm_splitk(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\utils\autotuner.py", line 256, in __call__
best_config = self._benchmark(args, kwargs, configs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\utils\autotuner.py", line 277, in _benchmark
self.kernel(*args, **kwargs, **config)
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\kernels\triton\spconv\sparse_submanifold_conv_fwd_implicit_gemm_splitk.py", line 133, in sparse_submanifold_conv_fwd_implicit_gemm_splitk
sparse_submanifold_conv_fwd_implicit_gemm_kernel[grid](
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\jit.py", line 390, in <lambda>
return lambda *args, **kwargs: self.run(grid=grid, warmup=False, *args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\utils\autotuner.py", line 67, in run
timings = {config: self._bench(*args, config=config, **kwargs) for config in pruned_configs}
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\autotuner.py", line 160, in _bench
return self.do_bench(kernel_call, quantiles=(0.5, 0.2, 0.8))
^^^^^^^^^^^^^
File "functools.py", line 998, in __get__
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\autotuner.py", line 121, in do_bench
return driver.active.get_benchmarker()
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\driver.py", line 30, in __getattr__
return getattr(self._initialize_obj(), name)
^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\driver.py", line 26, in _initialize_obj
self._obj = self._init_fn()
^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\driver.py", line 12, in _create_driver
return active_drivers[0]()
^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\driver.py", line 751, in __init__
self.utils = CudaUtils() # TODO: make static
^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\driver.py", line 68, in __init__
mod = compile_module_from_src(
^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\build.py", line 162, in compile_module_from_src
so = _build(name, src_path, tmpdir, library_dirs or [], include_dirs or [], libraries or [])
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\build.py", line 122, in _build
raise e
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\build.py", line 119, in _build
subprocess.check_call(cc_cmd)
File "subprocess.py", line 413, in check_call
subprocess.CalledProcessError: Command '['H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\tcc\tcc.exe', 'C:\Users\Administrator\AppData\Local\Temp\tmp7d7gbzqe\cuda_utils.c', '-O3', '-shared', '-Wno-psabi', '-o', 'C:\Users\Administrator\AppData\Local\Temp\tmp7d7gbzqe\cuda_utils.cp312-win_amd64.pyd', '-fPIC', '-D_Py_USE_GCC_BUILTIN_ATOMICS', '-lcuda', '-lpython312', '-LH:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\lib', '-LC:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v12.8\lib\x64', '-IH:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\include', '-IC:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v12.8\include', '-IC:\Users\Administrator\AppData\Local\Temp\tmp7d7gbzqe', '-IH:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Include']' returned non-zero exit status 1.
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 534, in execute
output_data, output_ui, has_subgraph, has_pending_tasks = await get_output_data(prompt_id, unique_id, obj, input_data_all, execution_block_cb=execution_block_cb, pre_execute_cb=pre_execute_cb, v3_data=v3_data)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 334, in get_output_data
return_values = await _async_map_node_over_list(prompt_id, unique_id, obj, input_data_all, obj.FUNCTION, allow_interrupt=True, execution_block_cb=execution_block_cb, pre_execute_cb=pre_execute_cb, v3_data=v3_data)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\comfyui-lora-manager\py\metadata_collector\metadata_hook.py", line 171, in async_map_node_over_list_with_metadata
results = await original_map_node_over_list(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 308, in _async_map_node_over_list
await process_inputs(input_dict, i)
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\execution.py", line 296, in process_inputs
result = f(**inputs)
^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\nodes.py", line 4233, in process
mesh = pipeline.decode_latent(shape_slat, texture_slat, resolution, use_tiled=use_tiled_decoder)[0]
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\utils\_contextlib.py", line 120, in decorate_context
return func(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\pipelines\trellis2_image_to_3d.py", line 1036, in decode_latent
meshes, subs = self.decode_shape_slat(shape_slat, resolution, use_tiled=use_tiled)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\pipelines\trellis2_image_to_3d.py", line 916, in decode_shape_slat
ret = self.models['shape_slat_decoder'](slat, return_subs=True, useTiled=use_tiled)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1773, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1784, in _call_impl
return forward_call(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\fdg_vae.py", line 94, in forward
decoded = super().forward(x, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\sparse_unet_vae.py", line 681, in forward
h = block(h)
^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1773, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1784, in _call_impl
return forward_call(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\sparse_unet_vae.py", line 408, in forward
return self._forward(x)
^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\models\sc_vaes\sparse_unet_vae.py", line 395, in _forward
h = self.conv(x)
^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1773, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\nn\modules\module.py", line 1784, in _call_impl
return forward_call(*args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\modules\sparse\conv\conv.py", line 19, in forward
return _backends[config.CONV].sparse_conv3d_forward(self, x)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\ComfyUI\custom_nodes\ComfyUI-Trellis2\trellis2\modules\sparse\conv\conv_flex_gemm.py", line 46, in sparse_conv3d_forward
out, neighbor_cache_ = sparse_submanifold_conv3d(
^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\ops\spconv\submanifold_conv3d.py", line 372, in sparse_submanifold_conv3d
return SubMConv3dFunction.apply(feats, coords, shape, neighbor_cache, weight, bias, dilation)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\torch\autograd\function.py", line 576, in apply
return super().apply(*args, **kwargs) # type: ignore[misc]
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\ops\spconv\submanifold_conv3d.py", line 321, in forward
output = SubMConv3dFunction._sparse_submanifold_conv_forward(feats, neighbor_cache, weight, bias)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\ops\spconv\submanifold_conv3d.py", line 166, in _sparse_submanifold_conv_forward
output = kernels.triton.sparse_submanifold_conv_fwd_implicit_gemm_splitk(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\utils\autotuner.py", line 256, in __call__
best_config = self._benchmark(args, kwargs, configs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\utils\autotuner.py", line 277, in _benchmark
self.kernel(*args, **kwargs, **config)
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\kernels\triton\spconv\sparse_submanifold_conv_fwd_implicit_gemm_splitk.py", line 133, in sparse_submanifold_conv_fwd_implicit_gemm_splitk
sparse_submanifold_conv_fwd_implicit_gemm_kernel[grid](
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\jit.py", line 390, in <lambda>
return lambda *args, **kwargs: self.run(grid=grid, warmup=False, *args, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\flex_gemm\utils\autotuner.py", line 67, in run
timings = {config: self._bench(*args, config=config, **kwargs) for config in pruned_configs}
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\autotuner.py", line 160, in _bench
return self.do_bench(kernel_call, quantiles=(0.5, 0.2, 0.8))
^^^^^^^^^^^^^
File "functools.py", line 998, in __get__
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\autotuner.py", line 121, in do_bench
return driver.active.get_benchmarker()
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\driver.py", line 30, in __getattr__
return getattr(self._initialize_obj(), name)
^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\driver.py", line 26, in _initialize_obj
self._obj = self._init_fn()
^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\driver.py", line 12, in _create_driver
return active_drivers[0]()
^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\driver.py", line 751, in __init__
self.utils = CudaUtils() # TODO: make static
^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\backends\nvidia\driver.py", line 68, in __init__
mod = compile_module_from_src(
^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\build.py", line 162, in compile_module_from_src
so = _build(name, src_path, tmpdir, library_dirs or [], include_dirs or [], libraries or [])
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\build.py", line 122, in _build
raise e
File "H:\AI\comfyui\ComfyUI_pytroch28cu128\python_embeded\Lib\site-packages\triton\runtime\build.py", line 119, in _build
subprocess.check_call(cc_cmd)
File "subprocess.py", line 413, in check_call