Revert "Fix RTX 5090 crash: use sdpa attention instead of sageattn"
Some checks failed
Build and Push Docker Image / build (push) Has been cancelled
Some checks failed
Build and Push Docker Image / build (push) Has been cancelled
This reverts commit 1e60401679.
This commit is contained in:
@@ -83,7 +83,7 @@
 "base_precision": "fp16_fast",
 "quantization": "disabled",
 "load_device": "offload_device",
-"attention_mode": "sdpa",
+"attention_mode": "sageattn",
 "rms_norm_function": "default",
 "block_swap_args": [
 "128",
@@ -101,7 +101,7 @@
 "base_precision": "fp16_fast",
 "quantization": "disabled",
 "load_device": "offload_device",
-"attention_mode": "sdpa",
+"attention_mode": "sageattn",
 "rms_norm_function": "default",
 "block_swap_args": [
 "128",
Reference in New Issue
Block a user