1 file changed: +1 -1 lines changed
Submodule cudnn-frontend updated 40 files
- CMakeLists.txt+1-1
 - include/cudnn_frontend/backend/backend_descriptor.h+2-2
 - include/cudnn_frontend/backend/device_properties.h+16-16
 - include/cudnn_frontend/backend/execution_helpers.h+8-8
 - include/cudnn_frontend/backend/kernel_cache.h+13-13
 - include/cudnn_frontend/backend/plan_helpers.h+56-56
 - include/cudnn_frontend/graph_helpers.h+2-2
 - include/cudnn_frontend/graph_interface.h+128-82
 - include/cudnn_frontend/graph_properties.h+124-146
 - include/cudnn_frontend/node/adaptive_layernorm.h+95-95
 - include/cudnn_frontend/node/block_scale_dequantize.h+27-27
 - include/cudnn_frontend/node/block_scale_quantize.h+27-27
 - include/cudnn_frontend/node/concatenate.h+21-21
 - include/cudnn_frontend/node/matmul_fp8.h+6-2
 - include/cudnn_frontend/node/paged_cache_load.h+12-8
 - include/cudnn_frontend/node/scaled_dot_product_flash_attention.h+277-341
 - include/cudnn_frontend/node/sdpa_fp8_bwd.h+19-2
 - include/cudnn_frontend/node/sdpa_support_surface.h+467
 - include/cudnn_frontend/node_interface.h+2-2
 - include/cudnn_frontend/plans.h+1-1
 - include/cudnn_frontend/utils/serialize.h+10-31
 - include/cudnn_frontend_utils.h+10-1
 - include/cudnn_frontend_version.h+1-1
 - python/cudnn/__init__.py+9-2
 - python/properties.cpp+46
 - python/pygraph/pygraph.cpp+28-6
 - python/pygraph/pygraph.h+59-5
 - python/pygraph/sdpa.cpp+319-132
 - samples/README.md+7-1
 - samples/cpp/matmul/blackwell_nvfp4_mxfp8_block_scale_matmul.cpp+1-1
 - samples/cpp/matmul/general_block_scale_matmul.cpp+1-1
 - samples/cpp/misc/custom_plan.cpp+5-3
 - samples/cpp/misc/deviceless_aot_compilation.cpp+5-5
 - samples/legacy_samples/utils/error_util.h-192
 - samples/python/33_layernorm_forward_training_and_backward_with_relu_bitmask.ipynb+583
 - samples/python/52_scaled_dot_product_attention_with_paged_caches.ipynb+233-61
 - samples/python/53_scaled_dot_product_attention_decode_with_paged_caches.ipynb+486
 - test/cpp/serialize.cpp+1-2
 - test/python/test_deviceless_aot_compilation.py+104
 - test/python/test_low_precision_matmul.py+4-4
 
0 commit comments