mirror of
https://github.com/zebrajr/pytorch.git
synced 2025-12-06 12:20:52 +01:00
[BE]: Update cudnn frontend submodule to 1.14.1 (#162347)
Fixes a few bugs introduced in CUDNN 1.11 that affect all our CUDA13 builds. Also adds support for new CUDNN features whenever we choose to update. @eqy, I'm pretty sure this addresses the concern you had over the previous upgrade, since that bugfix is now merged. This is a simple header-only update. Pull Request resolved: https://github.com/pytorch/pytorch/pull/162347 Approved by: https://github.com/eqy, https://github.com/atalman
This commit is contained in:
parent
8ec01f34e9
commit
ec2c1371af
|
|
@ -482,7 +482,7 @@ auto build_graph(
|
||||||
auto scaled_dot_product_flash_attention_options =
|
auto scaled_dot_product_flash_attention_options =
|
||||||
fe::graph::SDPA_attributes()
|
fe::graph::SDPA_attributes()
|
||||||
.set_name("CUDNN_SDPA")
|
.set_name("CUDNN_SDPA")
|
||||||
.set_is_inference(return_softmaxstats == false)
|
.set_generate_stats(return_softmaxstats)
|
||||||
.set_causal_mask(is_causal)
|
.set_causal_mask(is_causal)
|
||||||
.set_attn_scale(attn_scale);
|
.set_attn_scale(attn_scale);
|
||||||
if (use_ragged_in_dense(q, k, v, o, attn_bias.has_value())) {
|
if (use_ragged_in_dense(q, k, v, o, attn_bias.has_value())) {
|
||||||
|
|
@ -702,7 +702,7 @@ auto build_graph_nestedtensor(
|
||||||
auto scaled_dot_product_flash_attention_options =
|
auto scaled_dot_product_flash_attention_options =
|
||||||
fe::graph::SDPA_attributes()
|
fe::graph::SDPA_attributes()
|
||||||
.set_name("CUDNN_SDPA_NESTEDTENSOR")
|
.set_name("CUDNN_SDPA_NESTEDTENSOR")
|
||||||
.set_is_inference(return_softmaxstats == false)
|
.set_generate_stats(return_softmaxstats)
|
||||||
.set_causal_mask(is_causal)
|
.set_causal_mask(is_causal)
|
||||||
.set_attn_scale(attn_scale)
|
.set_attn_scale(attn_scale)
|
||||||
.set_seq_len_q(SEQ_LEN_Q_)
|
.set_seq_len_q(SEQ_LEN_Q_)
|
||||||
|
|
|
||||||
2
third_party/cudnn_frontend
vendored
2
third_party/cudnn_frontend
vendored
|
|
@ -1 +1 @@
|
||||||
Subproject commit f937055efc6d414d11f4c6577e3977fe74f35fb6
|
Subproject commit 1a7b4b78db44712fb9707d21cd2e3179f1fd88b8
|
||||||
Loading…
Reference in New Issue
Block a user