apparently impossible to compose blended code which would perform satisfactorily on all x86 and x86_64 cores, an extra RC4_CHAR code-path is introduced and the P4 core is detected at run-time. This way we keep the original performance on non-P4 implementations and turbo-charge P4 performance by a factor of 2.8x (on a 32-bit core).
		
			
				
	
	
		
			6 lines
		
	
	
		
			114 B
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			6 lines
		
	
	
		
			114 B
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 * Include-guarded header that declares nothing of its own: it only pulls in
 * <openssl/opensslconf.h> and <cryptlib.h> for the files that include it.
 *
 * NOTE(review): judging by the guard name this is presumably the private
 * ("local") header of the RC4 module -- confirm against the build tree.
 * NOTE(review): <cryptlib.h> is included with angle brackets, so it is
 * resolved through the compiler's include search path; verify that the
 * build passes the matching -I directory.
 */
#ifndef HEADER_RC4_LOCL_H
#define HEADER_RC4_LOCL_H

#include <openssl/opensslconf.h>
#include <cryptlib.h>

#endif /* HEADER_RC4_LOCL_H */