| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | /*
 | 
					
						
							| 
									
										
										
										
											2013-08-18 14:16:15 +00:00
										 |  |  |  * Copyright 2011-2013 Blender Foundation | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2013-08-18 14:16:15 +00:00
										 |  |  |  * Licensed under the Apache License, Version 2.0 (the "License"); | 
					
						
							|  |  |  |  * you may not use this file except in compliance with the License. | 
					
						
							|  |  |  |  * You may obtain a copy of the License at | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2013-08-18 14:16:15 +00:00
										 |  |  |  * http://www.apache.org/licenses/LICENSE-2.0
 | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2013-08-18 14:16:15 +00:00
										 |  |  |  * Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  |  * distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  |  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  |  * See the License for the specific language governing permissions and | 
					
						
							|  |  |  |  * limitations under the License | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  |  */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-04 18:50:09 +00:00
										 |  |  | /* Optimized CPU kernel entry points. This file is compiled with SSE2
 | 
					
						
							| 
									
										
										
										
											2012-06-09 17:22:52 +00:00
										 |  |  |  * optimization flags and nearly all functions inlined, while kernel.cpp | 
					
						
							|  |  |  |  * is compiled without for other CPU's. */ | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | #ifdef WITH_OPTIMIZED_KERNEL
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-10-05 19:56:34 +00:00
										 |  |  | /* SSE optimization disabled for now on 32 bit, see bug #36316 */ | 
					
						
							|  |  |  | #if !(defined(__GNUC__) && (defined(i386) || defined(_M_IX86)))
 | 
					
						
							| 
									
										
										
										
											2013-06-26 23:29:33 +00:00
										 |  |  | #define __KERNEL_SSE2__
 | 
					
						
							| 
									
										
										
										
											2013-10-05 19:56:34 +00:00
										 |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2013-06-26 22:12:23 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | #include "kernel.h"
 | 
					
						
							|  |  |  | #include "kernel_compat_cpu.h"
 | 
					
						
							|  |  |  | #include "kernel_math.h"
 | 
					
						
							|  |  |  | #include "kernel_types.h"
 | 
					
						
							|  |  |  | #include "kernel_globals.h"
 | 
					
						
							|  |  |  | #include "kernel_film.h"
 | 
					
						
							|  |  |  | #include "kernel_path.h"
 | 
					
						
							|  |  |  | #include "kernel_displace.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | CCL_NAMESPACE_BEGIN | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /* Path Tracing */ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-04 16:12:37 +00:00
										 |  |  | void kernel_cpu_sse2_path_trace(KernelGlobals *kg, float *buffer, unsigned int *rng_state, int sample, int x, int y, int offset, int stride) | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2013-08-23 14:34:34 +00:00
										 |  |  | #ifdef __BRANCHED_PATH__
 | 
					
						
							|  |  |  | 	if(kernel_data.integrator.branched) | 
					
						
							|  |  |  | 		kernel_branched_path_trace(kg, buffer, rng_state, sample, x, y, offset, stride); | 
					
						
							| 
									
										
										
										
											2013-08-09 20:03:49 +00:00
										 |  |  | 	else | 
					
						
							|  |  |  | #endif
 | 
					
						
							| 
									
										
										
										
											2013-08-23 14:34:34 +00:00
										 |  |  | 		kernel_path_trace(kg, buffer, rng_state, sample, x, y, offset, stride); | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-08-30 23:49:38 +00:00
										 |  |  | /* Film */ | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-08-30 23:49:38 +00:00
										 |  |  | void kernel_cpu_sse2_convert_to_byte(KernelGlobals *kg, uchar4 *rgba, float *buffer, float sample_scale, int x, int y, int offset, int stride) | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2013-08-30 23:49:38 +00:00
										 |  |  | 	kernel_film_convert_to_byte(kg, rgba, buffer, sample_scale, x, y, offset, stride); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | void kernel_cpu_sse2_convert_to_half_float(KernelGlobals *kg, uchar4 *rgba, float *buffer, float sample_scale, int x, int y, int offset, int stride) | 
					
						
							|  |  |  | { | 
					
						
							|  |  |  | 	kernel_film_convert_to_half_float(kg, rgba, buffer, sample_scale, x, y, offset, stride); | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-12-31 15:18:13 +00:00
										 |  |  | /* Shader Evaluate */ | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-04 16:12:37 +00:00
										 |  |  | void kernel_cpu_sse2_shader(KernelGlobals *kg, uint4 *input, float4 *output, int type, int i) | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | { | 
					
						
							| 
									
										
										
										
											2011-12-31 15:18:13 +00:00
										 |  |  | 	kernel_shader_evaluate(kg, input, output, (ShaderEvalType)type, i); | 
					
						
							| 
									
										
										
										
											2011-11-15 15:13:38 +00:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | CCL_NAMESPACE_END | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif
 | 
					
						
							|  |  |  | 
 |