2 files changed: +8 -3 lines changed
lines changed Original file line number Diff line number Diff line change 3838  FetchContent_Declare(
3939          vllm-flash-attn
4040          GIT_REPOSITORY https://github.com/vllm-project/flash-attention.git
41-           GIT_TAG 720c94869cf2e0ff5a706e9c7f1dce0939686ade 
41+           GIT_TAG 9bfa9869829d8c593527eb34c5271d0090f7ccc9  
4242          GIT_PROGRESS TRUE 
4343          # Don't share the vllm-flash-attn build between build types 
4444          BINARY_DIR ${CMAKE_BINARY_DIR} /vllm-flash-attn
@@ -64,4 +64,4 @@ install(
6464  DESTINATION  vllm_flash_attn
6565  COMPONENT  _vllm_fa3_C
6666  FILES_MATCHING PATTERN "*.py" 
67- )
67+ )
Original file line number Diff line number Diff line change @@ -595,14 +595,19 @@ def get_flash_attn_version():
595595        # if hopper default to FA3, otherwise stick to FA2 for now 
596596        # TODO(lucas): profile FA3 on ampere to see if it makes sense to 
597597        #  use FA3 as default for both 
598-         if  current_platform .get_device_capability ()[0 ] > =  9 :
598+         if  current_platform .get_device_capability ()[0 ] = =  9 :
599599            fa_version  =  3  if  is_fa_version_supported (3 ) else  2 
600600        else :
601601            fa_version  =  2 
602602
603603        if  envs .VLLM_FLASH_ATTN_VERSION  is  not   None :
604604            assert  envs .VLLM_FLASH_ATTN_VERSION  in  [2 , 3 ]
605605            fa_version  =  envs .VLLM_FLASH_ATTN_VERSION 
606+             if  (current_platform .get_device_capability ()[0 ] ==  10 
607+                     and  envs .VLLM_FLASH_ATTN_VERSION  ==  3 ):
608+                 logger .warning ("Cannot use FA version 3 on Blackwell platform" ,
609+                                "defaulting to FA version 2." )
610+                 fa_version  =  2 
606611
607612        if  not  is_fa_version_supported (fa_version ):
608613            logger .error ("Cannot use FA version %d is not supported due to %s" ,
    
 
   
 
     
   
   
          
     
  
    
     
 
    
      
     
 
     
    You can’t perform that action at this time.
  
 
    
  
     
    
      
        
     
 
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments