Cycles: Some more inline policy tweaks for CUDA 8

Makes it so that the toolkit makes exactly the same decisions about what to
inline, but unfortunately this makes a barely visible difference on the GTX-980.
This commit is contained in:
Sergey Sharybin 2016-08-02 15:04:34 +02:00
parent b416168d85
commit 500e0e9a3d
5 changed files with 55 additions and 25 deletions

@ -144,7 +144,16 @@ ccl_device_inline int bsdf_sample(KernelGlobals *kg,
return label;
}
ccl_device float3 bsdf_eval(KernelGlobals *kg, ShaderData *sd, const ShaderClosure *sc, const float3 omega_in, float *pdf)
/* Inline policy: CUDA builds (__KERNEL_CUDA__) use ccl_device_inline,
 * every other device keeps the plain ccl_device qualifier. */
#ifndef __KERNEL_CUDA__
ccl_device
#else
ccl_device_inline
#endif
float3 bsdf_eval(KernelGlobals *kg,
ShaderData *sd,
const ShaderClosure *sc,
const float3 omega_in,
float *pdf)
{
float3 eval;

@ -18,7 +18,7 @@ CCL_NAMESPACE_BEGIN
#ifdef __BRANCHED_PATH__
ccl_device void kernel_branched_path_ao(KernelGlobals *kg,
ccl_device_inline void kernel_branched_path_ao(KernelGlobals *kg,
ShaderData *sd,
ShaderData *emission_sd,
PathRadiance *L,

@ -149,7 +149,12 @@ ccl_device_noinline void shader_setup_from_ray(KernelGlobals *kg,
/* ShaderData setup from BSSRDF scatter */
#ifdef __SUBSURFACE__
ccl_device void shader_setup_from_subsurface(
/* Inline policy: CUDA builds (__KERNEL_CUDA__) use ccl_device_inline,
 * every other device keeps the plain ccl_device qualifier. */
# ifndef __KERNEL_CUDA__
ccl_device
# else
ccl_device_inline
# endif
void shader_setup_from_subsurface(
KernelGlobals *kg,
ShaderData *sd,
const Intersection *isect,
@ -533,7 +538,13 @@ ccl_device_inline void _shader_bsdf_multi_eval_branched(KernelGlobals *kg,
}
#endif
ccl_device void shader_bsdf_eval(KernelGlobals *kg,
/* Inline policy: CUDA builds (__KERNEL_CUDA__) use ccl_device_inline,
 * every other device keeps the plain ccl_device qualifier. */
#ifndef __KERNEL_CUDA__
ccl_device
#else
ccl_device_inline
#endif
void shader_bsdf_eval(KernelGlobals *kg,
ShaderData *sd,
const float3 omega_in,
BsdfEval *eval,

@ -87,7 +87,12 @@ ccl_device void svm_node_attr(KernelGlobals *kg, ShaderData *sd, float *stack, u
}
}
ccl_device void svm_node_attr_bump_dx(KernelGlobals *kg, ShaderData *sd, float *stack, uint4 node)
/* Inline policy: CUDA builds (__KERNEL_CUDA__) use ccl_device_noinline,
 * every other device keeps the plain ccl_device qualifier. */
#ifndef __KERNEL_CUDA__
ccl_device
#else
ccl_device_noinline
#endif
void svm_node_attr_bump_dx(KernelGlobals *kg, ShaderData *sd, float *stack, uint4 node)
{
NodeAttributeType type, mesh_type;
AttributeElement elem;
@ -123,7 +128,12 @@ ccl_device void svm_node_attr_bump_dx(KernelGlobals *kg, ShaderData *sd, float *
}
}
ccl_device void svm_node_attr_bump_dy(KernelGlobals *kg,
/* Inline policy: CUDA builds (__KERNEL_CUDA__) use ccl_device_noinline,
 * every other device keeps the plain ccl_device qualifier. */
#ifndef __KERNEL_CUDA__
ccl_device
#else
ccl_device_noinline
#endif
void svm_node_attr_bump_dy(KernelGlobals *kg,
ShaderData *sd,
float *stack,
uint4 node)

@ -34,7 +34,7 @@ CCL_NAMESPACE_BEGIN
/* Wireframe Node */
ccl_device float wireframe(KernelGlobals *kg,
ccl_device_inline float wireframe(KernelGlobals *kg,
ShaderData *sd,
float size,
int pixel_size,