|  |  | @ -50,10 +50,6 @@ void NCCLAllReduceOpHandle::RunImpl() { | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  |       auto &lod_tensor = s->FindVar(var_name)->Get<LoDTensor>(); |  |  |  |       auto &lod_tensor = s->FindVar(var_name)->Get<LoDTensor>(); | 
			
		
	
		
		
			
				
					
					|  |  |  |       void *buffer = const_cast<void *>(lod_tensor.data<void>()); |  |  |  |       void *buffer = const_cast<void *>(lod_tensor.data<void>()); | 
			
		
	
		
		
			
				
					
					|  |  |  |       uintptr_t buf = reinterpret_cast<uintptr_t>(buffer); |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |       if (buf % sizeof(float) != 0) { |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         VLOG(3) << "Buffer is not aligned " << buf; |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |       } |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  | 
 |  |  |  | 
 | 
			
		
	
		
		
			
				
					
					|  |  |  |       if (dtype == -1) { |  |  |  |       if (dtype == -1) { | 
			
		
	
		
		
			
				
					
					|  |  |  |         dtype = platform::ToNCCLDataType(lod_tensor.type()); |  |  |  |         dtype = platform::ToNCCLDataType(lod_tensor.type()); | 
			
		
	
	
		
		
			
				
					|  |  | 
 |