Skip to content

Commit 746500d

Browse files
Revert "[cuDNN] Enable cuDNN Frontend v8 API by Default (pytorch#84948)"
This reverts commit 427e0a6. Reverted pytorch#84948 on behalf of https://github.com/malfet due to Broke SM86 sanity
1 parent 2cfc4cb commit 746500d

File tree

3 files changed

+7
-7
lines changed

3 files changed

+7
-7
lines changed

aten/src/ATen/native/ConvUtils.h

+2-2
Original file line numberDiff line numberDiff line change
@@ -66,11 +66,11 @@ namespace {
6666
}
6767

6868
static inline bool cudnnv8_enabled_check_debug() {
69-
static bool cudnnv8_flag = c10::utils::check_env("TORCH_CUDNN_V8_API_DISABLED") != true;
69+
static bool cudnnv8_flag = c10::utils::check_env("TORCH_CUDNN_V8_API_ENABLED") == true;
7070
static bool cudnnv8_debug = c10::utils::check_env("TORCH_CUDNN_V8_API_DEBUG") == true;
7171
static uint8_t cudnnv8_debugcount = 0;
7272
if (cudnnv8_debug == 1 && cudnnv8_debugcount < 10) {
73-
TORCH_WARN("TORCH_CUDNN_V8_DEBUG ON, V8 ON: ", cudnnv8_flag, " TORCH_CUDNN_USE_HEURISTIC_MODE B: ", cudnnv8_heuristic_mode_b);
73+
TORCH_WARN("TORCH_CUDNN_V8_DEBUG ON, V8_FLAG: ", cudnnv8_flag, " TORCH_CUDNN_USE_HEURISTIC_MODE B: ", cudnnv8_heuristic_mode_b);
7474
cudnnv8_debugcount++;
7575
}
7676
return cudnnv8_flag == 1;

aten/src/ATen/native/cudnn/ConvShared.h

+1-1
Original file line numberDiff line numberDiff line change
@@ -113,7 +113,7 @@ void raw_cudnn_convolution_add_relu_fallback_out(
113113

114114
#if HAS_CUDNN_V8()
115115
// v7 functions are preserved here to allow for runtime switching to v7
116-
// (e.g., TORCH_CUDNN_V8_API_DISABLED=1).
116+
// (e.g., TORCH_CUDNN_V8_API_ENABLED=0).
117117
// Note that v7 forward/backward out can have different behavior from the v8
118118
// versions, as v7 explicitly splits large tensors as a 32-bit indexing
119119
// workaround whereas v8 expects cuDNN to handle large tensors.

test/test_cuda.py

+4-4
Original file line numberDiff line numberDiff line change
@@ -2894,10 +2894,10 @@ def test_autocast_torch_bf16(self):
28942894
op, args = op_with_args[0], op_with_args[1]
28952895
if len(op_with_args) == 3:
28962896
skip_test = op_with_args[2] # TEST_WITH_ROCM
2897-
should_error_from_cudnn = 'cudnn' in op and \
2898-
('TORCH_CUDNN_V8_API_DISABLED' in os.environ and
2899-
int(os.environ['TORCH_CUDNN_V8_API_DISABLED']) or
2900-
torch.cuda.get_device_capability() < (8, 0))
2897+
should_error_from_cudnn = 'cudnn' in op and not\
2898+
('TORCH_CUDNN_V8_API_ENABLED' in os.environ and
2899+
int(os.environ['TORCH_CUDNN_V8_API_ENABLED']) and
2900+
torch.cuda.get_device_capability() >= (8, 0))
29012901
should_error_from_not_implemented = should_error_from_cudnn or 'prelu' in op or 'thnn' in op \
29022902
or 'fused' in op or 'gru' in op or op == '_thnn_fused_lstm_cell' or op == 'lstm_cell'
29032903
if not skip_test:

0 commit comments

Comments (0)