A               
*$Dec  3 202420:16:52HOST64sm_86//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-25769353
// Cuda compilation tools, release 10.1, V10.1.105
// Based on LLVM 3.4svn
//

.version 6.4
.target sm_30
.address_size 64

	// .globl	PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel
// Constant-space lookup tables, declared as raw bytes with 4-byte alignment.
// Every 36-byte table holds nine 4-byte words and every 12-byte table holds
// three. Read as little-endian IEEE-754 singles the words are plausible
// coefficients: e.g. the first three words of kRGB32f_To_601YPbPr are
// 0x3E991687, 0x3F1645A2, 0x3DE978D5 ~= 0.299, 0.587, 0.114.
// NOTE(review): the names suggest 3x3 colour-conversion matrices between
// RGB and BT.601 / BT.709 YPbPr/YCbCr variants -- layout (row- vs
// column-major) cannot be determined from this chunk; confirm with the users.
// None of these tables is referenced by the Bayered kernel below.
.const .align 4 .b8 kRGB32f_To_601YPbPr[36] = {135, 22, 153, 62, 162, 69, 22, 63, 213, 120, 233, 61, 33, 201, 44, 190, 111, 155, 169, 190, 0, 0, 0, 63, 0, 0, 0, 63, 70, 94, 214, 190, 232, 134, 166, 189};
.const .align 4 .b8 k601YPbPr_To_RGB32f[36] = {0, 0, 128, 63, 0, 0, 0, 0, 188, 116, 179, 63, 0, 0, 128, 63, 152, 50, 176, 190, 158, 209, 54, 191, 0, 0, 128, 63, 229, 208, 226, 63, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_601YCbCr[36] = {70, 246, 130, 66, 145, 141, 0, 67, 94, 186, 199, 65, 33, 48, 23, 194, 240, 103, 148, 194, 0, 0, 224, 66, 0, 0, 224, 66, 111, 146, 187, 194, 70, 182, 145, 193};
.const .align 4 .b8 k601YCbCr_To_RGB32f[36] = {37, 160, 149, 59, 0, 0, 0, 0, 182, 23, 205, 59, 37, 160, 149, 59, 40, 15, 201, 186, 156, 239, 80, 187, 37, 160, 149, 59, 236, 155, 1, 60, 0, 0, 0, 0};
.const .align 4 .b8 kRGB8u_To_601YCbCr[36] = {219, 121, 131, 62, 152, 14, 1, 63, 18, 131, 200, 61, 174, 199, 23, 190, 238, 252, 148, 190, 197, 224, 224, 62, 197, 224, 224, 62, 217, 78, 188, 190, 174, 71, 146, 189};
.const .align 4 .b8 k601YCbCr_To_RGB8u[36] = {127, 10, 149, 63, 0, 0, 0, 0, 160, 74, 204, 63, 127, 10, 149, 63, 254, 148, 200, 190, 184, 30, 80, 191, 127, 10, 149, 63, 78, 26, 1, 64, 0, 0, 0, 0};
.const .align 4 .b8 kRGB8u_To_601YCbCrFullRange[36] = {135, 22, 153, 62, 162, 69, 22, 63, 213, 120, 233, 61, 166, 27, 44, 190, 39, 241, 168, 190, 250, 254, 254, 62, 250, 254, 254, 62, 43, 135, 213, 190, 59, 223, 165, 189};
.const .align 4 .b8 k601YCbCrFullRange_To_RGB8u[36] = {0, 0, 128, 63, 0, 0, 0, 0, 72, 193, 178, 63, 0, 0, 128, 63, 143, 130, 175, 190, 225, 26, 54, 191, 0, 0, 128, 63, 20, 238, 225, 63, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_601YCbCrFullRange[36] = {113, 125, 152, 66, 92, 175, 21, 67, 92, 143, 232, 65, 158, 111, 43, 194, 49, 72, 168, 194, 0, 0, 254, 66, 0, 0, 254, 66, 170, 177, 212, 194, 88, 57, 165, 193};
.const .align 4 .b8 k601YCbCrFullRange_To_RGB32f[36] = {129, 128, 128, 59, 0, 0, 0, 0, 188, 116, 179, 59, 129, 128, 128, 59, 194, 50, 176, 186, 179, 209, 54, 187, 129, 128, 128, 59, 229, 208, 226, 59, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_709YPbPr[36] = {208, 179, 89, 62, 89, 23, 55, 63, 152, 221, 147, 61, 186, 164, 234, 189, 210, 86, 197, 190, 0, 0, 0, 63, 0, 0, 0, 63, 190, 134, 232, 190, 16, 202, 59, 189};
.const .align 4 .b8 k709YPbPr_To_RGB32f[36] = {0, 0, 128, 63, 0, 0, 0, 0, 12, 147, 201, 63, 0, 0, 128, 63, 221, 209, 63, 190, 243, 173, 239, 190, 0, 0, 128, 63, 77, 132, 237, 63, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_709YCbCr[36] = {106, 60, 58, 66, 6, 161, 28, 67, 244, 253, 124, 65, 223, 79, 205, 193, 8, 172, 172, 194, 0, 0, 224, 66, 0, 0, 224, 66, 195, 117, 203, 194, 236, 81, 36, 193};
.const .align 4 .b8 k709YCbCr_To_RGB32f[36] = {37, 160, 149, 59, 0, 0, 0, 0, 239, 94, 230, 59, 37, 160, 149, 59, 33, 57, 91, 186, 178, 245, 8, 187, 37, 160, 149, 59, 82, 185, 7, 60, 0, 0, 0, 0};
.const .align 4 .b8 k709YCbCrFullRange_To_RGB32f[36] = {131, 128, 128, 59, 0, 0, 0, 0, 28, 147, 201, 59, 131, 128, 128, 59, 61, 210, 63, 186, 248, 173, 239, 186, 131, 128, 128, 59, 82, 132, 237, 59, 0, 0, 0, 0};
.const .align 4 .b8 kRGB8u_To_709YCbCr[36] = {207, 247, 58, 62, 53, 62, 29, 63, 231, 251, 125, 61, 184, 30, 206, 189, 23, 89, 173, 190, 197, 224, 224, 62, 197, 224, 224, 62, 12, 66, 204, 190, 195, 245, 36, 189};
.const .align 4 .b8 k709YCbCr_To_RGB8u[36] = {127, 10, 149, 63, 0, 0, 0, 0, 147, 120, 229, 63, 127, 10, 149, 63, 53, 94, 90, 190, 205, 108, 8, 191, 127, 10, 149, 63, 154, 49, 7, 64, 0, 0, 0, 0};
.const .align 4 .b8 k709YCbCr_To_601YCbCr[36] = {0, 0, 128, 63, 23, 100, 203, 61, 1, 77, 68, 62, 0, 0, 0, 0, 18, 103, 125, 63, 10, 158, 226, 189, 0, 0, 0, 0, 61, 98, 148, 189, 249, 191, 123, 63};
.const .align 4 .b8 k601YCbCr_To_709YCbCr[36] = {0, 0, 128, 63, 122, 165, 236, 189, 179, 237, 84, 190, 0, 0, 0, 0, 204, 98, 130, 63, 216, 188, 234, 61, 0, 0, 0, 0, 74, 179, 153, 61, 234, 61, 131, 63};
// Declared without an initializer.
.const .align 4 .b8 kZeroMatrix[36];
// Three-word offset vectors; read as little-endian floats they are
// {16.0, 128.0, 128.0} and {0.0, 128.0, 128.0} respectively.
.const .align 4 .b8 kYCbCrOffset[12] = {0, 0, 128, 65, 0, 0, 0, 67, 0, 0, 0, 67};
.const .align 4 .b8 kYCbCrFullRangeOffset[12] = {0, 0, 0, 0, 0, 0, 0, 67, 0, 0, 0, 67};
// Scalar constants in constant space. PTX "0f" literals are the raw
// IEEE-754 single-precision bit pattern in hex. None of these is referenced
// by the Bayered kernel below.
// NOTE(review): the PQ_* / HLG_* prefixes presumably refer to the PQ and HLG
// HDR transfer functions -- confirm against the kernels that read them.
// 0f3E232000 = 0.1593017578125, 0f429DB000 = 78.84375
.const .align 4 .f32 PQ_m1 = 0f3E232000;
.const .align 4 .f32 PQ_m1Inv = 0f40C8E06B;
.const .align 4 .f32 PQ_m2 = 0f429DB000;
.const .align 4 .f32 PQ_m2Inv = 0f3C4FCDAC;
// 0f3F560000 = 0.8359375, 0f4196D000 = 18.8515625, 0f41958000 = 18.6875
.const .align 4 .f32 PQ_c1 = 0f3F560000;
.const .align 4 .f32 PQ_c2 = 0f4196D000;
.const .align 4 .f32 PQ_c3 = 0f41958000;
// 0f4019999A ~= 2.4
.const .align 4 .f32 Gamma1886 = 0f4019999A;
// 0f461C4000 = 10000.0
.const .align 4 .f32 PQ_Lpeak = 0f461C4000;
.const .align 4 .f32 PQ_a = 0f3F8CAC08;
.const .align 4 .f32 PQ_b = 0f426E1556;
.const .align 4 .f32 PQ_c = 0f39B033E5;
.const .align 4 .f32 PQ_s = 0f4385EB85;
// 0f3EE66666 ~= 0.45
.const .align 4 .f32 PQ_g = 0f3EE66666;
// 0f42C80000 = 100.0
.const .align 4 .f32 scaleFD = 0f42C80000;
.const .align 4 .f32 HLG_a = 0f3E371FF0;
.const .align 4 .f32 HLG_b = 0f3E91C020;
.const .align 4 .f32 HLG_c = 0f3F0F564F;
.const .align 4 .f32 HLG_inva = 0f40B2F029;
// 0f41200000 = 10.0, 0f3DCCCCCD ~= 0.1
.const .align 4 .f32 HLG_alpha = 0f41200000;
.const .align 4 .f32 HLG_invAlpha = 0f3DCCCCCD;
// 0f3F99999A ~= 1.2, 0f3E4CCCCD ~= 0.2, 0f3E2AAAAB ~= 0.1666667
.const .align 4 .f32 HLG_gamma = 0f3F99999A;
.const .align 4 .f32 HLG_gammaM1 = 0f3E4CCCCD;
.const .align 4 .f32 HLG_gammaM1Dgamma = 0f3E2AAAAB;
// ~= 0.2627, 0.6780, 0.0593
.const .align 4 .f32 HLG_YR = 0f3E86809D;
.const .align 4 .f32 HLG_YG = 0f3F2D9168;
.const .align 4 .f32 HLG_YB = 0f3D72E48F;
// 0f447A0000 = 1000.0
.const .align 4 .f32 HLG_Lpeak = 0f447A0000;
.const .align 4 .u32 kRandMax = 32767;
// _ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix has been demoted
// _ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix has been demoted
// _ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix has been demoted
// _ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix has been demoted

// ---------------------------------------------------------------------------
// PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel
//
// Each thread processes one 2x2 quad of single-float source samples and
// writes four 4-component output pixels (no interpolation between samples).
// Per sample:
//   1. The sample is routed to exactly one of three input channels; the
//      other two channels receive sample * 0.0.
//        quad (x,   y  ) -> channel 2      quad (x+1, y  ) -> channel 1
//        quad (x,   y+1) -> channel 1      quad (x+1, y+1) -> channel 0
//   2. Each channel is limited with min() against the matching float of
//      param_12 (+0, +4, +8).
//   3. The 3-vector is multiplied by a 3x3 matrix held in shared memory.
//   4. If param_14 != 0, each result v becomes sign(v) * |v|^0.41666666
//      (exponent constant 0f3ED55555), computed with lg2/ex2 approximations.
//   5. The pixel is stored as {row2 . v, row1 . v, row0 . v, 1.0}, either as
//      four f32 (param_8 != 0) or four f16 (param_8 == 0).
//
// Parameters (as used by the code below):
//   param_0   u64  source buffer; holds both the samples and the matrix
//   param_1   u64  destination buffer
//   param_2   s32  element offset added to every source sample index
//   param_3   s32  source row stride, in float elements
//   param_4   s32  != 0: source rows are walked with negated stride starting
//                  at row (param_10 - 1)
//   param_5   u32  declared but never read
//   param_6   s32  destination row stride, in pixels
//   param_7   s32  != 0: destination row index becomes (param_10 - 1) - y
//   param_8   s32  != 0: 16-byte f32x4 pixels; == 0: 8-byte f16x4 pixels
//   param_9   s32  exclusive bound for the quad's x coordinate
//   param_10  s32  exclusive bound for the quad's y coordinate
//   param_11  s32  != 0: columns 0 and 2 of every matrix row are swapped
//                  while the matrix is copied to shared memory
//   param_12  16B  three f32 clamp values at +0/+4/+8 (bytes 12..15 unused)
//   param_13  s32  float index in the param_0 buffer of the first of the
//                  nine matrix coefficients
//   param_14  s32  != 0: apply the power curve of step 4
//
// NOTE(review): only the quad's top-left coordinate is bounds-checked; the
// x+1 / y+1 samples and pixels are accessed unconditionally. This presumably
// relies on param_9 and param_10 being even -- confirm with the host code.
// ---------------------------------------------------------------------------
.visible .entry PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel(
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_0,
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_1,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_2,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_3,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_4,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_5,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_6,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_7,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_8,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_9,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_10,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_11,
	.param .align 16 .b8 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_12[16],
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_13,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_14
)
{
	.reg .pred 	%p<34>;
	.reg .b16 	%rs<17>;
	.reg .f32 	%f<307>;
	.reg .b32 	%r<90>;
	.reg .b64 	%rd<77>;
	// demoted variable
	// 36-byte (nine f32) per-block copy of the 3x3 matrix.
	.shared .align 4 .b8 _ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix[36];

	// Fetch the arguments (param_5 is never loaded).
	ld.param.u64 	%rd2, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_0];
	ld.param.u64 	%rd3, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_1];
	ld.param.u32 	%r15, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_2];
	ld.param.u32 	%r16, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_3];
	ld.param.u32 	%r17, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_4];
	ld.param.u32 	%r18, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_6];
	ld.param.u32 	%r19, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_7];
	ld.param.u32 	%r20, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_8];
	ld.param.u32 	%r21, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_9];
	ld.param.u32 	%r22, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_10];
	ld.param.u32 	%r23, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_11];
	// %f80 / %f81 / %f82 = clamp values for channels 0 / 1 / 2.
	ld.param.f32 	%f82, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_12+8];
	ld.param.f32 	%f81, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_12+4];
	ld.param.f32 	%f80, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_12];
	ld.param.u32 	%r24, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_13];
	ld.param.u32 	%r25, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel_param_14];
	// %rd1 = source buffer as a global-space address.
	cvta.to.global.u64 	%rd1, %rd2;
	mov.u32 	%r1, %tid.x;
	mov.u32 	%r2, %tid.y;
	// Only threads with tid.y == 0 and tid.x in 0..2 copy the matrix;
	// everyone else skips straight to the barrier.
	setp.ne.s32	%p1, %r2, 0;
	setp.gt.u32	%p2, %r1, 2;
	or.pred  	%p3, %p1, %p2;
	@%p3 bra 	BB0_2;

	// Thread tid.x copies matrix row tid.x (three floats at 3 * tid.x).
	// Shared column 0 is read from source column 2 when param_11 != 0,
	// otherwise from source column 0.
	cvt.s64.s32	%rd4, %r24;
	setp.ne.s32	%p4, %r23, 0;
	mul.lo.s32 	%r26, %r1, 3;
	cvt.s64.s32	%rd5, %r26;
	selp.b64	%rd6, 2, 0, %p4;
	add.s64 	%rd7, %rd4, %rd6;
	add.s64 	%rd8, %rd7, %rd5;
	shl.b64 	%rd9, %rd8, 2;
	add.s64 	%rd10, %rd1, %rd9;
	ld.global.f32 	%f84, [%rd10];
	// %r29 = shared address of this row (byte offset 12 * tid.x).
	shl.b32 	%r27, %r26, 2;
	mov.u32 	%r28, _ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix;
	add.s32 	%r29, %r28, %r27;
	st.volatile.shared.f32 	[%r29], %f84;
	// The middle column is always copied straight across.
	add.s32 	%r30, %r24, %r26;
	mul.wide.s32 	%rd11, %r30, 4;
	add.s64 	%rd12, %rd1, %rd11;
	ld.global.f32 	%f85, [%rd12+4];
	st.volatile.shared.f32 	[%r29+4], %f85;
	// Shared column 2 gets the source column that column 0 did not take.
	selp.b64	%rd13, 0, 2, %p4;
	add.s64 	%rd14, %rd4, %rd13;
	add.s64 	%rd15, %rd14, %rd5;
	shl.b64 	%rd16, %rd15, 2;
	add.s64 	%rd17, %rd1, %rd16;
	ld.global.f32 	%f86, [%rd17];
	st.volatile.shared.f32 	[%r29+8], %f86;

BB0_2:
	// Block-wide barrier, executed by every thread before any early exit,
	// so the matrix is visible to all threads of the block.
	bar.sync 	0;
	// %r3 = 2 * (ntid.x * ctaid.x + tid.x)   quad x coordinate
	// %r4 = 2 * (ntid.y * ctaid.y + tid.y)   quad y coordinate
	mov.u32 	%r31, %ctaid.x;
	mov.u32 	%r32, %ntid.x;
	mad.lo.s32 	%r33, %r32, %r31, %r1;
	shl.b32 	%r3, %r33, 1;
	setp.ge.s32	%p5, %r3, %r21;
	mov.u32 	%r34, %ctaid.y;
	mov.u32 	%r35, %ntid.y;
	mad.lo.s32 	%r36, %r35, %r34, %r2;
	shl.b32 	%r4, %r36, 1;
	setp.ge.s32	%p6, %r4, %r22;
	// Exit when the quad origin is outside param_9 x param_10.
	or.pred  	%p7, %p5, %p6;
	@%p7 bra 	BB0_59;

	// ---- Addressing setup shared by all four samples ----
	// %r40  = signed source row stride (+param_3, or -param_3 if param_4 != 0)
	// %rd21 = source base index: param_2, plus (param_10 - 1) * param_3 when
	//         param_4 != 0
	// %r5   = destination row: y, or (param_10 - 1) - y when param_7 != 0
	// %p9   = (param_7 == 0), reused below to step to the next output row
	cvt.s64.s32	%rd18, %r15;
	add.s32 	%r37, %r22, -1;
	mul.lo.s32 	%r38, %r37, %r16;
	cvt.s64.s32	%rd19, %r38;
	neg.s32 	%r39, %r16;
	setp.eq.s32	%p8, %r17, 0;
	selp.b32	%r40, %r16, %r39, %p8;
	selp.b64	%rd20, 0, %rd19, %p8;
	add.s64 	%rd21, %rd20, %rd18;
	sub.s32 	%r41, %r37, %r4;
	setp.eq.s32	%p9, %r19, 0;
	selp.b32	%r5, %r4, %r41, %p9;
	// ---- Sample (x, y): feeds channel 2 ----
	mul.lo.s32 	%r6, %r4, %r40;
	add.s32 	%r42, %r6, %r3;
	cvt.s64.s32	%rd22, %r42;
	add.s64 	%rd23, %rd22, %rd21;
	shl.b64 	%rd24, %rd23, 2;
	add.s64 	%rd25, %rd1, %rd24;
	ld.global.f32 	%f87, [%rd25];
	// %f88 = sample * 0.0, used for the two channels this sample does not feed.
	mul.ftz.f32 	%f88, %f87, 0f00000000;
	min.ftz.f32 	%f2, %f88, %f80;
	min.ftz.f32 	%f4, %f88, %f81;
	min.ftz.f32 	%f6, %f87, %f82;
	// %f289 = matrix row 2 (bytes 24..35) dotted with (%f2, %f4, %f6).
	ld.volatile.shared.f32 	%f89, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f90, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+28];
	mul.ftz.f32 	%f91, %f4, %f90;
	fma.rn.ftz.f32 	%f92, %f2, %f89, %f91;
	ld.volatile.shared.f32 	%f93, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f289, %f6, %f93, %f92;
	// %p10 = (param_14 == 0): skip the power curve. Reused for all four samples.
	setp.eq.s32	%p10, %r25, 0;
	@%p10 bra 	BB0_13;

	// Power curve, first output component. setp.ltu is true for negative or
	// unordered (NaN) values, which take the sign-preserving path.
	setp.ltu.ftz.f32	%p11, %f289, 0f00000000;
	@%p11 bra 	BB0_6;
	bra.uni 	BB0_5;

BB0_6:
	// Negative input: result = -exp2(log2(-v) * 0.41666666).
	neg.ftz.f32 	%f96, %f289;
	lg2.approx.ftz.f32 	%f97, %f96;
	mul.ftz.f32 	%f98, %f97, 0f3ED55555;
	ex2.approx.ftz.f32 	%f99, %f98;
	neg.ftz.f32 	%f289, %f99;
	bra.uni 	BB0_7;

BB0_13:
	// No power curve: plain dot products for matrix row 1 (%f290) and
	// row 0 (%f291).
	ld.volatile.shared.f32 	%f122, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f123, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f124, %f4, %f123;
	fma.rn.ftz.f32 	%f125, %f2, %f122, %f124;
	ld.volatile.shared.f32 	%f126, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f290, %f6, %f126, %f125;
	ld.volatile.shared.f32 	%f127, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f128, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f129, %f4, %f128;
	fma.rn.ftz.f32 	%f130, %f2, %f127, %f129;
	ld.volatile.shared.f32 	%f131, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f291, %f6, %f131, %f130;
	bra.uni 	BB0_14;

BB0_5:
	// Non-negative input: result = exp2(log2(v) * 0.41666666).
	lg2.approx.ftz.f32 	%f94, %f289;
	mul.ftz.f32 	%f95, %f94, 0f3ED55555;
	ex2.approx.ftz.f32 	%f289, %f95;

BB0_7:
	// Matrix row 1 dot product (%f11), then the same power curve -> %f290.
	ld.volatile.shared.f32 	%f100, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f101, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f102, %f4, %f101;
	fma.rn.ftz.f32 	%f103, %f2, %f100, %f102;
	ld.volatile.shared.f32 	%f104, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f11, %f6, %f104, %f103;
	setp.ltu.ftz.f32	%p12, %f11, 0f00000000;
	@%p12 bra 	BB0_9;
	bra.uni 	BB0_8;

BB0_9:
	neg.ftz.f32 	%f107, %f11;
	lg2.approx.ftz.f32 	%f108, %f107;
	mul.ftz.f32 	%f109, %f108, 0f3ED55555;
	ex2.approx.ftz.f32 	%f110, %f109;
	neg.ftz.f32 	%f290, %f110;
	bra.uni 	BB0_10;

BB0_8:
	lg2.approx.ftz.f32 	%f105, %f11;
	mul.ftz.f32 	%f106, %f105, 0f3ED55555;
	ex2.approx.ftz.f32 	%f290, %f106;

BB0_10:
	// Matrix row 0 dot product (%f15), then the power curve -> %f291.
	ld.volatile.shared.f32 	%f111, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f112, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f113, %f4, %f112;
	fma.rn.ftz.f32 	%f114, %f2, %f111, %f113;
	ld.volatile.shared.f32 	%f115, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f15, %f6, %f115, %f114;
	setp.ltu.ftz.f32	%p13, %f15, 0f00000000;
	@%p13 bra 	BB0_12;
	bra.uni 	BB0_11;

BB0_12:
	neg.ftz.f32 	%f118, %f15;
	lg2.approx.ftz.f32 	%f119, %f118;
	mul.ftz.f32 	%f120, %f119, 0f3ED55555;
	ex2.approx.ftz.f32 	%f121, %f120;
	neg.ftz.f32 	%f291, %f121;
	bra.uni 	BB0_14;

BB0_11:
	lg2.approx.ftz.f32 	%f116, %f15;
	mul.ftz.f32 	%f117, %f116, 0f3ED55555;
	ex2.approx.ftz.f32 	%f291, %f117;

BB0_14:
	// Store output pixel (x, destination row %r5).
	// %r7 = %r5 * param_6, %r8 = pixel index.
	// %p14 = (param_8 == 0) selects the f16 path; reused for all four pixels.
	mul.lo.s32 	%r7, %r5, %r18;
	add.s32 	%r8, %r7, %r3;
	setp.eq.s32	%p14, %r20, 0;
	@%p14 bra 	BB0_16;

	// f32 path: one 16-byte vector store {%f289, %f290, %f291, 1.0}.
	cvta.to.global.u64 	%rd26, %rd3;
	mul.wide.s32 	%rd27, %r8, 16;
	add.s64 	%rd28, %rd26, %rd27;
	mov.f32 	%f132, 0f3F800000;
	st.global.v4.f32 	[%rd28], {%f289, %f290, %f291, %f132};
	bra.uni 	BB0_17;

BB0_16:
	// f16 path: round each component to half and store four u16 (8 bytes).
	cvta.to.global.u64 	%rd29, %rd3;
	// inline asm
	{  cvt.rn.f16.f32 %rs1, %f289;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs2, %f290;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs3, %f291;}

	// inline asm
	mov.f32 	%f136, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs4, %f136;}

	// inline asm
	mul.wide.s32 	%rd30, %r8, 8;
	add.s64 	%rd31, %rd29, %rd30;
	st.global.u16 	[%rd31], %rs1;
	st.global.u16 	[%rd31+2], %rs2;
	st.global.u16 	[%rd31+4], %rs3;
	st.global.u16 	[%rd31+6], %rs4;

BB0_17:
	// ---- Sample (x+1, y): feeds channel 1 ----
	// %r9 = x + 1 (no separate bounds check, see header note).
	add.s32 	%r9, %r3, 1;
	add.s32 	%r53, %r6, %r9;
	cvt.s64.s32	%rd32, %r53;
	add.s64 	%rd37, %rd32, %rd21;
	shl.b64 	%rd39, %rd37, 2;
	add.s64 	%rd40, %rd1, %rd39;
	ld.global.f32 	%f137, [%rd40];
	mul.ftz.f32 	%f138, %f137, 0f00000000;
	min.ftz.f32 	%f23, %f138, %f80;
	min.ftz.f32 	%f24, %f137, %f81;
	min.ftz.f32 	%f25, %f138, %f82;
	// Matrix row 2 dot product -> %f294.
	ld.volatile.shared.f32 	%f139, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f140, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+28];
	mul.ftz.f32 	%f141, %f24, %f140;
	fma.rn.ftz.f32 	%f142, %f23, %f139, %f141;
	ld.volatile.shared.f32 	%f143, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f294, %f25, %f143, %f142;
	@%p10 bra 	BB0_27;

	// Power curve on %f294 (same scheme as for the first sample).
	setp.ltu.ftz.f32	%p17, %f294, 0f00000000;
	@%p17 bra 	BB0_20;
	bra.uni 	BB0_19;

BB0_20:
	neg.ftz.f32 	%f146, %f294;
	lg2.approx.ftz.f32 	%f147, %f146;
	mul.ftz.f32 	%f148, %f147, 0f3ED55555;
	ex2.approx.ftz.f32 	%f149, %f148;
	neg.ftz.f32 	%f294, %f149;
	bra.uni 	BB0_21;

BB0_27:
	// No power curve: row 1 -> %f295, row 0 -> %f296.
	ld.volatile.shared.f32 	%f172, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f173, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f174, %f24, %f173;
	fma.rn.ftz.f32 	%f175, %f23, %f172, %f174;
	ld.volatile.shared.f32 	%f176, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f295, %f25, %f176, %f175;
	ld.volatile.shared.f32 	%f177, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f178, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f179, %f24, %f178;
	fma.rn.ftz.f32 	%f180, %f23, %f177, %f179;
	ld.volatile.shared.f32 	%f181, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f296, %f25, %f181, %f180;
	bra.uni 	BB0_28;

BB0_19:
	lg2.approx.ftz.f32 	%f144, %f294;
	mul.ftz.f32 	%f145, %f144, 0f3ED55555;
	ex2.approx.ftz.f32 	%f294, %f145;

BB0_21:
	// Row 1 dot product (%f30) and power curve -> %f295.
	ld.volatile.shared.f32 	%f150, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f151, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f152, %f24, %f151;
	fma.rn.ftz.f32 	%f153, %f23, %f150, %f152;
	ld.volatile.shared.f32 	%f154, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f30, %f25, %f154, %f153;
	setp.ltu.ftz.f32	%p18, %f30, 0f00000000;
	@%p18 bra 	BB0_23;
	bra.uni 	BB0_22;

BB0_23:
	neg.ftz.f32 	%f157, %f30;
	lg2.approx.ftz.f32 	%f158, %f157;
	mul.ftz.f32 	%f159, %f158, 0f3ED55555;
	ex2.approx.ftz.f32 	%f160, %f159;
	neg.ftz.f32 	%f295, %f160;
	bra.uni 	BB0_24;

BB0_22:
	lg2.approx.ftz.f32 	%f155, %f30;
	mul.ftz.f32 	%f156, %f155, 0f3ED55555;
	ex2.approx.ftz.f32 	%f295, %f156;

BB0_24:
	// Row 0 dot product (%f34) and power curve -> %f296.
	ld.volatile.shared.f32 	%f161, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f162, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f163, %f24, %f162;
	fma.rn.ftz.f32 	%f164, %f23, %f161, %f163;
	ld.volatile.shared.f32 	%f165, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f34, %f25, %f165, %f164;
	setp.ltu.ftz.f32	%p19, %f34, 0f00000000;
	@%p19 bra 	BB0_26;
	bra.uni 	BB0_25;

BB0_26:
	neg.ftz.f32 	%f168, %f34;
	lg2.approx.ftz.f32 	%f169, %f168;
	mul.ftz.f32 	%f170, %f169, 0f3ED55555;
	ex2.approx.ftz.f32 	%f171, %f170;
	neg.ftz.f32 	%f296, %f171;
	bra.uni 	BB0_28;

BB0_25:
	lg2.approx.ftz.f32 	%f166, %f34;
	mul.ftz.f32 	%f167, %f166, 0f3ED55555;
	ex2.approx.ftz.f32 	%f296, %f167;

BB0_28:
	// Store output pixel (x+1, destination row %r5); %r10 = pixel index.
	add.s32 	%r10, %r7, %r9;
	@%p14 bra 	BB0_30;

	cvta.to.global.u64 	%rd41, %rd3;
	mul.wide.s32 	%rd42, %r10, 16;
	add.s64 	%rd43, %rd41, %rd42;
	mov.f32 	%f182, 0f3F800000;
	st.global.v4.f32 	[%rd43], {%f294, %f295, %f296, %f182};
	bra.uni 	BB0_31;

BB0_30:
	cvta.to.global.u64 	%rd44, %rd3;
	// inline asm
	{  cvt.rn.f16.f32 %rs5, %f294;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs6, %f295;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs7, %f296;}

	// inline asm
	mov.f32 	%f186, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs8, %f186;}

	// inline asm
	mul.wide.s32 	%rd45, %r10, 8;
	add.s64 	%rd46, %rd44, %rd45;
	st.global.u16 	[%rd46], %rs5;
	st.global.u16 	[%rd46+2], %rs6;
	st.global.u16 	[%rd46+4], %rs7;
	st.global.u16 	[%rd46+6], %rs8;

BB0_31:
	// ---- Sample (x, y+1): feeds channel 1 ----
	// %r11 = (y + 1) * signed source stride (no separate bounds check).
	add.s32 	%r61, %r4, 1;
	mul.lo.s32 	%r11, %r61, %r40;
	add.s32 	%r69, %r11, %r3;
	cvt.s64.s32	%rd47, %r69;
	add.s64 	%rd52, %rd47, %rd21;
	shl.b64 	%rd54, %rd52, 2;
	add.s64 	%rd55, %rd1, %rd54;
	ld.global.f32 	%f187, [%rd55];
	mul.ftz.f32 	%f188, %f187, 0f00000000;
	min.ftz.f32 	%f42, %f188, %f80;
	min.ftz.f32 	%f43, %f187, %f81;
	min.ftz.f32 	%f44, %f188, %f82;
	// Matrix row 2 dot product -> %f299.
	ld.volatile.shared.f32 	%f189, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f190, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+28];
	mul.ftz.f32 	%f191, %f43, %f190;
	fma.rn.ftz.f32 	%f192, %f42, %f189, %f191;
	ld.volatile.shared.f32 	%f193, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f299, %f44, %f193, %f192;
	@%p10 bra 	BB0_41;

	// Power curve on %f299.
	setp.ltu.ftz.f32	%p23, %f299, 0f00000000;
	@%p23 bra 	BB0_34;
	bra.uni 	BB0_33;

BB0_34:
	neg.ftz.f32 	%f196, %f299;
	lg2.approx.ftz.f32 	%f197, %f196;
	mul.ftz.f32 	%f198, %f197, 0f3ED55555;
	ex2.approx.ftz.f32 	%f199, %f198;
	neg.ftz.f32 	%f299, %f199;
	bra.uni 	BB0_35;

BB0_41:
	// No power curve: row 1 -> %f300, row 0 -> %f301.
	ld.volatile.shared.f32 	%f222, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f223, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f224, %f43, %f223;
	fma.rn.ftz.f32 	%f225, %f42, %f222, %f224;
	ld.volatile.shared.f32 	%f226, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f300, %f44, %f226, %f225;
	ld.volatile.shared.f32 	%f227, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f228, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f229, %f43, %f228;
	fma.rn.ftz.f32 	%f230, %f42, %f227, %f229;
	ld.volatile.shared.f32 	%f231, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f301, %f44, %f231, %f230;
	bra.uni 	BB0_42;

BB0_33:
	lg2.approx.ftz.f32 	%f194, %f299;
	mul.ftz.f32 	%f195, %f194, 0f3ED55555;
	ex2.approx.ftz.f32 	%f299, %f195;

BB0_35:
	// Row 1 dot product (%f49) and power curve -> %f300.
	ld.volatile.shared.f32 	%f200, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f201, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f202, %f43, %f201;
	fma.rn.ftz.f32 	%f203, %f42, %f200, %f202;
	ld.volatile.shared.f32 	%f204, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f49, %f44, %f204, %f203;
	setp.ltu.ftz.f32	%p24, %f49, 0f00000000;
	@%p24 bra 	BB0_37;
	bra.uni 	BB0_36;

BB0_37:
	neg.ftz.f32 	%f207, %f49;
	lg2.approx.ftz.f32 	%f208, %f207;
	mul.ftz.f32 	%f209, %f208, 0f3ED55555;
	ex2.approx.ftz.f32 	%f210, %f209;
	neg.ftz.f32 	%f300, %f210;
	bra.uni 	BB0_38;

BB0_36:
	lg2.approx.ftz.f32 	%f205, %f49;
	mul.ftz.f32 	%f206, %f205, 0f3ED55555;
	ex2.approx.ftz.f32 	%f300, %f206;

BB0_38:
	// Row 0 dot product (%f53) and power curve -> %f301.
	ld.volatile.shared.f32 	%f211, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f212, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f213, %f43, %f212;
	fma.rn.ftz.f32 	%f214, %f42, %f211, %f213;
	ld.volatile.shared.f32 	%f215, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f53, %f44, %f215, %f214;
	setp.ltu.ftz.f32	%p25, %f53, 0f00000000;
	@%p25 bra 	BB0_40;
	bra.uni 	BB0_39;

BB0_40:
	neg.ftz.f32 	%f218, %f53;
	lg2.approx.ftz.f32 	%f219, %f218;
	mul.ftz.f32 	%f220, %f219, 0f3ED55555;
	ex2.approx.ftz.f32 	%f221, %f220;
	neg.ftz.f32 	%f301, %f221;
	bra.uni 	BB0_42;

BB0_39:
	lg2.approx.ftz.f32 	%f216, %f53;
	mul.ftz.f32 	%f217, %f216, 0f3ED55555;
	ex2.approx.ftz.f32 	%f301, %f217;

BB0_42:
	// Second output row: %r5 + 1 normally, %r5 - 1 when param_7 != 0.
	// %r12 = that row * param_6, %r13 = pixel index for column x.
	selp.b32	%r80, 1, -1, %p9;
	add.s32 	%r81, %r5, %r80;
	mul.lo.s32 	%r12, %r81, %r18;
	add.s32 	%r13, %r12, %r3;
	@%p14 bra 	BB0_44;

	cvta.to.global.u64 	%rd56, %rd3;
	mul.wide.s32 	%rd57, %r13, 16;
	add.s64 	%rd58, %rd56, %rd57;
	mov.f32 	%f232, 0f3F800000;
	st.global.v4.f32 	[%rd58], {%f299, %f300, %f301, %f232};
	bra.uni 	BB0_45;

BB0_44:
	cvta.to.global.u64 	%rd59, %rd3;
	// inline asm
	{  cvt.rn.f16.f32 %rs9, %f299;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs10, %f300;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs11, %f301;}

	// inline asm
	mov.f32 	%f236, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs12, %f236;}

	// inline asm
	mul.wide.s32 	%rd60, %r13, 8;
	add.s64 	%rd61, %rd59, %rd60;
	st.global.u16 	[%rd61], %rs9;
	st.global.u16 	[%rd61+2], %rs10;
	st.global.u16 	[%rd61+4], %rs11;
	st.global.u16 	[%rd61+6], %rs12;

BB0_45:
	// ---- Sample (x+1, y+1): feeds channel 0 ----
	add.s32 	%r87, %r11, %r9;
	cvt.s64.s32	%rd62, %r87;
	add.s64 	%rd67, %rd62, %rd21;
	shl.b64 	%rd69, %rd67, 2;
	add.s64 	%rd70, %rd1, %rd69;
	ld.global.f32 	%f237, [%rd70];
	mul.ftz.f32 	%f238, %f237, 0f00000000;
	min.ftz.f32 	%f61, %f237, %f80;
	min.ftz.f32 	%f62, %f238, %f81;
	min.ftz.f32 	%f63, %f238, %f82;
	// Matrix row 2 dot product -> %f304.
	ld.volatile.shared.f32 	%f239, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f240, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+28];
	mul.ftz.f32 	%f241, %f62, %f240;
	fma.rn.ftz.f32 	%f242, %f61, %f239, %f241;
	ld.volatile.shared.f32 	%f243, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f304, %f63, %f243, %f242;
	@%p10 bra 	BB0_55;

	// Power curve on %f304.
	setp.ltu.ftz.f32	%p30, %f304, 0f00000000;
	@%p30 bra 	BB0_48;
	bra.uni 	BB0_47;

BB0_48:
	neg.ftz.f32 	%f246, %f304;
	lg2.approx.ftz.f32 	%f247, %f246;
	mul.ftz.f32 	%f248, %f247, 0f3ED55555;
	ex2.approx.ftz.f32 	%f249, %f248;
	neg.ftz.f32 	%f304, %f249;
	bra.uni 	BB0_49;

BB0_55:
	// No power curve: row 1 -> %f305, row 0 -> %f306.
	ld.volatile.shared.f32 	%f272, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f273, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f274, %f62, %f273;
	fma.rn.ftz.f32 	%f275, %f61, %f272, %f274;
	ld.volatile.shared.f32 	%f276, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f305, %f63, %f276, %f275;
	ld.volatile.shared.f32 	%f277, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f278, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f279, %f62, %f278;
	fma.rn.ftz.f32 	%f280, %f61, %f277, %f279;
	ld.volatile.shared.f32 	%f281, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f306, %f63, %f281, %f280;
	bra.uni 	BB0_56;

BB0_47:
	lg2.approx.ftz.f32 	%f244, %f304;
	mul.ftz.f32 	%f245, %f244, 0f3ED55555;
	ex2.approx.ftz.f32 	%f304, %f245;

BB0_49:
	// Row 1 dot product (%f68) and power curve -> %f305.
	ld.volatile.shared.f32 	%f250, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f251, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+16];
	mul.ftz.f32 	%f252, %f62, %f251;
	fma.rn.ftz.f32 	%f253, %f61, %f250, %f252;
	ld.volatile.shared.f32 	%f254, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f68, %f63, %f254, %f253;
	setp.ltu.ftz.f32	%p31, %f68, 0f00000000;
	@%p31 bra 	BB0_51;
	bra.uni 	BB0_50;

BB0_51:
	neg.ftz.f32 	%f257, %f68;
	lg2.approx.ftz.f32 	%f258, %f257;
	mul.ftz.f32 	%f259, %f258, 0f3ED55555;
	ex2.approx.ftz.f32 	%f260, %f259;
	neg.ftz.f32 	%f305, %f260;
	bra.uni 	BB0_52;

BB0_50:
	lg2.approx.ftz.f32 	%f255, %f68;
	mul.ftz.f32 	%f256, %f255, 0f3ED55555;
	ex2.approx.ftz.f32 	%f305, %f256;

BB0_52:
	// Row 0 dot product (%f72) and power curve -> %f306.
	ld.volatile.shared.f32 	%f261, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix];
	ld.volatile.shared.f32 	%f262, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+4];
	mul.ftz.f32 	%f263, %f62, %f262;
	fma.rn.ftz.f32 	%f264, %f61, %f261, %f263;
	ld.volatile.shared.f32 	%f265, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f72, %f63, %f265, %f264;
	setp.ltu.ftz.f32	%p32, %f72, 0f00000000;
	@%p32 bra 	BB0_54;
	bra.uni 	BB0_53;

BB0_54:
	neg.ftz.f32 	%f268, %f72;
	lg2.approx.ftz.f32 	%f269, %f268;
	mul.ftz.f32 	%f270, %f269, 0f3ED55555;
	ex2.approx.ftz.f32 	%f271, %f270;
	neg.ftz.f32 	%f306, %f271;
	bra.uni 	BB0_56;

BB0_53:
	lg2.approx.ftz.f32 	%f266, %f72;
	mul.ftz.f32 	%f267, %f266, 0f3ED55555;
	ex2.approx.ftz.f32 	%f306, %f267;

BB0_56:
	// Store output pixel (x+1, second output row); %r14 = pixel index.
	add.s32 	%r14, %r12, %r9;
	@%p14 bra 	BB0_58;

	cvta.to.global.u64 	%rd71, %rd3;
	mul.wide.s32 	%rd72, %r14, 16;
	add.s64 	%rd73, %rd71, %rd72;
	mov.f32 	%f282, 0f3F800000;
	st.global.v4.f32 	[%rd73], {%f304, %f305, %f306, %f282};
	bra.uni 	BB0_59;

BB0_58:
	cvta.to.global.u64 	%rd74, %rd3;
	// inline asm
	{  cvt.rn.f16.f32 %rs13, %f304;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs14, %f305;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs15, %f306;}

	// inline asm
	mov.f32 	%f286, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs16, %f286;}

	// inline asm
	mul.wide.s32 	%rd75, %r14, 8;
	add.s64 	%rd76, %rd74, %rd75;
	st.global.u16 	[%rd76], %rs13;
	st.global.u16 	[%rd76+2], %rs14;
	st.global.u16 	[%rd76+4], %rs15;
	st.global.u16 	[%rd76+6], %rs16;

BB0_59:
	// Common exit: reached after the last store and by out-of-range threads.
	ret;
}

	// .globl	PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel
.visible .entry PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel(
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_0,
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_1,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_2,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_3,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_4,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_5,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_6,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_7,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_8,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_9,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_10,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_11,
	.param .align 16 .b8 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_12[16],
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_13,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_14
)
{
	.reg .pred 	%p<32>;
	.reg .b16 	%rs<17>;
	.reg .f32 	%f<293>;
	.reg .b32 	%r<92>;
	.reg .b64 	%rd<62>;
	// demoted variable
	.shared .align 4 .b8 _ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix[36];

	ld.param.u64 	%rd3, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_0];
	ld.param.u64 	%rd2, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_1];
	ld.param.u32 	%r10, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_2];
	ld.param.u32 	%r11, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_3];
	ld.param.u32 	%r12, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_4];
	ld.param.u32 	%r13, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_6];
	ld.param.u32 	%r14, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_7];
	ld.param.u32 	%r15, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_8];
	ld.param.u32 	%r16, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_9];
	ld.param.u32 	%r17, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_10];
	ld.param.u32 	%r18, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_11];
	ld.param.f32 	%f73, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_12+8];
	ld.param.f32 	%f72, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_12+4];
	ld.param.f32 	%f71, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_12];
	ld.param.u32 	%r19, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_13];
	ld.param.u32 	%r20, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel_param_14];
	cvta.to.global.u64 	%rd1, %rd3;
	mov.u32 	%r1, %tid.x;
	mov.u32 	%r2, %tid.y;
	setp.ne.s32	%p1, %r2, 0;
	setp.gt.u32	%p2, %r1, 2;
	or.pred  	%p3, %p1, %p2;
	@%p3 bra 	BB1_2;

	cvt.s64.s32	%rd4, %r19;
	setp.ne.s32	%p4, %r18, 0;
	mul.lo.s32 	%r21, %r1, 3;
	cvt.s64.s32	%rd5, %r21;
	selp.b64	%rd6, 2, 0, %p4;
	add.s64 	%rd7, %rd4, %rd6;
	add.s64 	%rd8, %rd7, %rd5;
	shl.b64 	%rd9, %rd8, 2;
	add.s64 	%rd10, %rd1, %rd9;
	ld.global.f32 	%f75, [%rd10];
	shl.b32 	%r22, %r21, 2;
	mov.u32 	%r23, _ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix;
	add.s32 	%r24, %r23, %r22;
	st.volatile.shared.f32 	[%r24], %f75;
	add.s32 	%r25, %r19, %r21;
	mul.wide.s32 	%rd11, %r25, 4;
	add.s64 	%rd12, %rd1, %rd11;
	ld.global.f32 	%f76, [%rd12+4];
	st.volatile.shared.f32 	[%r24+4], %f76;
	selp.b64	%rd13, 0, 2, %p4;
	add.s64 	%rd14, %rd4, %rd13;
	add.s64 	%rd15, %rd14, %rd5;
	shl.b64 	%rd16, %rd15, 2;
	add.s64 	%rd17, %rd1, %rd16;
	ld.global.f32 	%f77, [%rd17];
	st.volatile.shared.f32 	[%r24+8], %f77;

BB1_2:
	bar.sync 	0;
	mov.u32 	%r26, %ctaid.x;
	mov.u32 	%r27, %ntid.x;
	mad.lo.s32 	%r28, %r27, %r26, %r1;
	shl.b32 	%r3, %r28, 1;
	setp.ge.s32	%p5, %r3, %r16;
	mov.u32 	%r29, %ctaid.y;
	mov.u32 	%r30, %ntid.y;
	mad.lo.s32 	%r31, %r30, %r29, %r2;
	shl.b32 	%r4, %r31, 1;
	setp.ge.s32	%p6, %r4, %r17;
	or.pred  	%p7, %p5, %p6;
	@%p7 bra 	BB1_59;

	cvt.s64.s32	%rd18, %r10;
	add.s32 	%r32, %r17, -1;
	mul.lo.s32 	%r33, %r32, %r11;
	cvt.s64.s32	%rd19, %r33;
	neg.s32 	%r34, %r11;
	setp.eq.s32	%p8, %r12, 0;
	selp.b32	%r35, %r11, %r34, %p8;
	selp.b64	%rd20, 0, %rd19, %p8;
	add.s64 	%rd21, %rd20, %rd18;
	mul.lo.s32 	%r36, %r4, %r35;
	add.s32 	%r37, %r36, %r3;
	cvt.s64.s32	%rd22, %r37;
	add.s64 	%rd23, %rd22, %rd21;
	shl.b64 	%rd24, %rd23, 2;
	add.s64 	%rd25, %rd1, %rd24;
	add.s32 	%r38, %r3, 1;
	add.s32 	%r39, %r36, %r38;
	cvt.s64.s32	%rd26, %r39;
	add.s64 	%rd27, %rd26, %rd21;
	shl.b64 	%rd28, %rd27, 2;
	add.s64 	%rd29, %rd1, %rd28;
	add.s32 	%r40, %r4, 1;
	mul.lo.s32 	%r41, %r40, %r35;
	add.s32 	%r42, %r41, %r3;
	cvt.s64.s32	%rd30, %r42;
	add.s64 	%rd31, %rd30, %rd21;
	shl.b64 	%rd32, %rd31, 2;
	add.s64 	%rd33, %rd1, %rd32;
	ld.global.f32 	%f1, [%rd33];
	add.s32 	%r43, %r41, %r38;
	cvt.s64.s32	%rd34, %r43;
	add.s64 	%rd35, %rd34, %rd21;
	shl.b64 	%rd36, %rd35, 2;
	add.s64 	%rd37, %rd1, %rd36;
	ld.global.f32 	%f78, [%rd25];
	min.ftz.f32 	%f2, %f78, %f71;
	ld.global.f32 	%f79, [%rd29];
	min.ftz.f32 	%f4, %f79, %f72;
	ld.global.f32 	%f80, [%rd37];
	min.ftz.f32 	%f5, %f80, %f73;
	ld.volatile.shared.f32 	%f81, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f82, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+28];
	mul.ftz.f32 	%f83, %f4, %f82;
	fma.rn.ftz.f32 	%f84, %f2, %f81, %f83;
	ld.volatile.shared.f32 	%f85, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f275, %f5, %f85, %f84;
	setp.eq.s32	%p9, %r20, 0;
	@%p9 bra 	BB1_13;

	setp.ltu.ftz.f32	%p10, %f275, 0f00000000;
	@%p10 bra 	BB1_6;
	bra.uni 	BB1_5;

BB1_6:
	neg.ftz.f32 	%f88, %f275;
	lg2.approx.ftz.f32 	%f89, %f88;
	mul.ftz.f32 	%f90, %f89, 0f3ED55555;
	ex2.approx.ftz.f32 	%f91, %f90;
	neg.ftz.f32 	%f275, %f91;
	bra.uni 	BB1_7;

BB1_13:
	ld.volatile.shared.f32 	%f114, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f115, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f116, %f4, %f115;
	fma.rn.ftz.f32 	%f117, %f2, %f114, %f116;
	ld.volatile.shared.f32 	%f118, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f276, %f5, %f118, %f117;
	ld.volatile.shared.f32 	%f119, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f120, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f121, %f4, %f120;
	fma.rn.ftz.f32 	%f122, %f2, %f119, %f121;
	ld.volatile.shared.f32 	%f123, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f277, %f5, %f123, %f122;
	bra.uni 	BB1_14;

BB1_5:
	lg2.approx.ftz.f32 	%f86, %f275;
	mul.ftz.f32 	%f87, %f86, 0f3ED55555;
	ex2.approx.ftz.f32 	%f275, %f87;

BB1_7:
	ld.volatile.shared.f32 	%f92, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f93, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f94, %f4, %f93;
	fma.rn.ftz.f32 	%f95, %f2, %f92, %f94;
	ld.volatile.shared.f32 	%f96, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f10, %f5, %f96, %f95;
	setp.ltu.ftz.f32	%p11, %f10, 0f00000000;
	@%p11 bra 	BB1_9;
	bra.uni 	BB1_8;

BB1_9:
	neg.ftz.f32 	%f99, %f10;
	lg2.approx.ftz.f32 	%f100, %f99;
	mul.ftz.f32 	%f101, %f100, 0f3ED55555;
	ex2.approx.ftz.f32 	%f102, %f101;
	neg.ftz.f32 	%f276, %f102;
	bra.uni 	BB1_10;

BB1_8:
	lg2.approx.ftz.f32 	%f97, %f10;
	mul.ftz.f32 	%f98, %f97, 0f3ED55555;
	ex2.approx.ftz.f32 	%f276, %f98;

BB1_10:
	ld.volatile.shared.f32 	%f103, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f104, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f105, %f4, %f104;
	fma.rn.ftz.f32 	%f106, %f2, %f103, %f105;
	ld.volatile.shared.f32 	%f107, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f14, %f5, %f107, %f106;
	setp.ltu.ftz.f32	%p12, %f14, 0f00000000;
	@%p12 bra 	BB1_12;
	bra.uni 	BB1_11;

BB1_12:
	neg.ftz.f32 	%f110, %f14;
	lg2.approx.ftz.f32 	%f111, %f110;
	mul.ftz.f32 	%f112, %f111, 0f3ED55555;
	ex2.approx.ftz.f32 	%f113, %f112;
	neg.ftz.f32 	%f277, %f113;
	bra.uni 	BB1_14;

BB1_11:
	lg2.approx.ftz.f32 	%f108, %f14;
	mul.ftz.f32 	%f109, %f108, 0f3ED55555;
	ex2.approx.ftz.f32 	%f277, %f109;

BB1_14:
	sub.s32 	%r50, %r32, %r4;
	setp.eq.s32	%p13, %r14, 0;
	selp.b32	%r51, %r4, %r50, %p13;
	mad.lo.s32 	%r5, %r51, %r13, %r3;
	setp.eq.s32	%p14, %r15, 0;
	@%p14 bra 	BB1_16;

	cvta.to.global.u64 	%rd38, %rd2;
	mul.wide.s32 	%rd39, %r5, 16;
	add.s64 	%rd40, %rd38, %rd39;
	mov.f32 	%f124, 0f3F800000;
	st.global.v4.f32 	[%rd40], {%f275, %f276, %f277, %f124};
	bra.uni 	BB1_17;

BB1_16:
	cvta.to.global.u64 	%rd41, %rd2;
	// inline asm
	{  cvt.rn.f16.f32 %rs1, %f275;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs2, %f276;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs3, %f277;}

	// inline asm
	mov.f32 	%f128, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs4, %f128;}

	// inline asm
	mul.wide.s32 	%rd42, %r5, 8;
	add.s64 	%rd43, %rd41, %rd42;
	st.global.u16 	[%rd43], %rs1;
	st.global.u16 	[%rd43+2], %rs2;
	st.global.u16 	[%rd43+4], %rs3;
	st.global.u16 	[%rd43+6], %rs4;

BB1_17:
	ld.volatile.shared.f32 	%f129, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f130, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+28];
	mul.ftz.f32 	%f131, %f4, %f130;
	fma.rn.ftz.f32 	%f132, %f2, %f129, %f131;
	ld.volatile.shared.f32 	%f133, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f280, %f5, %f133, %f132;
	@%p9 bra 	BB1_27;

	setp.ltu.ftz.f32	%p16, %f280, 0f00000000;
	@%p16 bra 	BB1_20;
	bra.uni 	BB1_19;

BB1_20:
	neg.ftz.f32 	%f136, %f280;
	lg2.approx.ftz.f32 	%f137, %f136;
	mul.ftz.f32 	%f138, %f137, 0f3ED55555;
	ex2.approx.ftz.f32 	%f139, %f138;
	neg.ftz.f32 	%f280, %f139;
	bra.uni 	BB1_21;

BB1_27:
	ld.volatile.shared.f32 	%f162, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f163, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f164, %f4, %f163;
	fma.rn.ftz.f32 	%f165, %f2, %f162, %f164;
	ld.volatile.shared.f32 	%f166, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f281, %f5, %f166, %f165;
	ld.volatile.shared.f32 	%f167, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f168, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f169, %f4, %f168;
	fma.rn.ftz.f32 	%f170, %f2, %f167, %f169;
	ld.volatile.shared.f32 	%f171, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f282, %f5, %f171, %f170;
	bra.uni 	BB1_28;

BB1_19:
	lg2.approx.ftz.f32 	%f134, %f280;
	mul.ftz.f32 	%f135, %f134, 0f3ED55555;
	ex2.approx.ftz.f32 	%f280, %f135;

BB1_21:
	ld.volatile.shared.f32 	%f140, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f141, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f142, %f4, %f141;
	fma.rn.ftz.f32 	%f143, %f2, %f140, %f142;
	ld.volatile.shared.f32 	%f144, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f26, %f5, %f144, %f143;
	setp.ltu.ftz.f32	%p17, %f26, 0f00000000;
	@%p17 bra 	BB1_23;
	bra.uni 	BB1_22;

BB1_23:
	neg.ftz.f32 	%f147, %f26;
	lg2.approx.ftz.f32 	%f148, %f147;
	mul.ftz.f32 	%f149, %f148, 0f3ED55555;
	ex2.approx.ftz.f32 	%f150, %f149;
	neg.ftz.f32 	%f281, %f150;
	bra.uni 	BB1_24;

BB1_22:
	lg2.approx.ftz.f32 	%f145, %f26;
	mul.ftz.f32 	%f146, %f145, 0f3ED55555;
	ex2.approx.ftz.f32 	%f281, %f146;

BB1_24:
	ld.volatile.shared.f32 	%f151, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f152, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f153, %f4, %f152;
	fma.rn.ftz.f32 	%f154, %f2, %f151, %f153;
	ld.volatile.shared.f32 	%f155, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f30, %f5, %f155, %f154;
	setp.ltu.ftz.f32	%p18, %f30, 0f00000000;
	@%p18 bra 	BB1_26;
	bra.uni 	BB1_25;

BB1_26:
	neg.ftz.f32 	%f158, %f30;
	lg2.approx.ftz.f32 	%f159, %f158;
	mul.ftz.f32 	%f160, %f159, 0f3ED55555;
	ex2.approx.ftz.f32 	%f161, %f160;
	neg.ftz.f32 	%f282, %f161;
	bra.uni 	BB1_28;

BB1_25:
	lg2.approx.ftz.f32 	%f156, %f30;
	mul.ftz.f32 	%f157, %f156, 0f3ED55555;
	ex2.approx.ftz.f32 	%f282, %f157;

BB1_28:
	add.s32 	%r6, %r5, 1;
	@%p14 bra 	BB1_30;

	cvta.to.global.u64 	%rd44, %rd2;
	mul.wide.s32 	%rd45, %r6, 16;
	add.s64 	%rd46, %rd44, %rd45;
	mov.f32 	%f172, 0f3F800000;
	st.global.v4.f32 	[%rd46], {%f280, %f281, %f282, %f172};
	bra.uni 	BB1_31;

BB1_30:
	cvta.to.global.u64 	%rd47, %rd2;
	// inline asm
	{  cvt.rn.f16.f32 %rs5, %f280;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs6, %f281;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs7, %f282;}

	// inline asm
	mov.f32 	%f176, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs8, %f176;}

	// inline asm
	mul.wide.s32 	%rd48, %r6, 8;
	add.s64 	%rd49, %rd47, %rd48;
	st.global.u16 	[%rd49], %rs5;
	st.global.u16 	[%rd49+2], %rs6;
	st.global.u16 	[%rd49+4], %rs7;
	st.global.u16 	[%rd49+6], %rs8;

BB1_31:
	ld.volatile.shared.f32 	%f177, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f178, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+28];
	min.ftz.f32 	%f38, %f1, %f72;
	mul.ftz.f32 	%f179, %f38, %f178;
	fma.rn.ftz.f32 	%f180, %f2, %f177, %f179;
	ld.volatile.shared.f32 	%f181, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f285, %f5, %f181, %f180;
	@%p9 bra 	BB1_41;

	setp.ltu.ftz.f32	%p22, %f285, 0f00000000;
	@%p22 bra 	BB1_34;
	bra.uni 	BB1_33;

BB1_34:
	neg.ftz.f32 	%f184, %f285;
	lg2.approx.ftz.f32 	%f185, %f184;
	mul.ftz.f32 	%f186, %f185, 0f3ED55555;
	ex2.approx.ftz.f32 	%f187, %f186;
	neg.ftz.f32 	%f285, %f187;
	bra.uni 	BB1_35;

BB1_41:
	ld.volatile.shared.f32 	%f210, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f211, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f212, %f38, %f211;
	fma.rn.ftz.f32 	%f213, %f2, %f210, %f212;
	ld.volatile.shared.f32 	%f214, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f286, %f5, %f214, %f213;
	ld.volatile.shared.f32 	%f215, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f216, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f217, %f38, %f216;
	fma.rn.ftz.f32 	%f218, %f2, %f215, %f217;
	ld.volatile.shared.f32 	%f219, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f287, %f5, %f219, %f218;
	bra.uni 	BB1_42;

BB1_33:
	lg2.approx.ftz.f32 	%f182, %f285;
	mul.ftz.f32 	%f183, %f182, 0f3ED55555;
	ex2.approx.ftz.f32 	%f285, %f183;

BB1_35:
	ld.volatile.shared.f32 	%f188, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f189, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f190, %f38, %f189;
	fma.rn.ftz.f32 	%f191, %f2, %f188, %f190;
	ld.volatile.shared.f32 	%f192, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f43, %f5, %f192, %f191;
	setp.ltu.ftz.f32	%p23, %f43, 0f00000000;
	@%p23 bra 	BB1_37;
	bra.uni 	BB1_36;

BB1_37:
	neg.ftz.f32 	%f195, %f43;
	lg2.approx.ftz.f32 	%f196, %f195;
	mul.ftz.f32 	%f197, %f196, 0f3ED55555;
	ex2.approx.ftz.f32 	%f198, %f197;
	neg.ftz.f32 	%f286, %f198;
	bra.uni 	BB1_38;

BB1_36:
	lg2.approx.ftz.f32 	%f193, %f43;
	mul.ftz.f32 	%f194, %f193, 0f3ED55555;
	ex2.approx.ftz.f32 	%f286, %f194;

BB1_38:
	ld.volatile.shared.f32 	%f199, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f200, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f201, %f38, %f200;
	fma.rn.ftz.f32 	%f202, %f2, %f199, %f201;
	ld.volatile.shared.f32 	%f203, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f47, %f5, %f203, %f202;
	setp.ltu.ftz.f32	%p24, %f47, 0f00000000;
	@%p24 bra 	BB1_40;
	bra.uni 	BB1_39;

BB1_40:
	neg.ftz.f32 	%f206, %f47;
	lg2.approx.ftz.f32 	%f207, %f206;
	mul.ftz.f32 	%f208, %f207, 0f3ED55555;
	ex2.approx.ftz.f32 	%f209, %f208;
	neg.ftz.f32 	%f287, %f209;
	bra.uni 	BB1_42;

BB1_39:
	lg2.approx.ftz.f32 	%f204, %f47;
	mul.ftz.f32 	%f205, %f204, 0f3ED55555;
	ex2.approx.ftz.f32 	%f287, %f205;

BB1_42:
	selp.b32	%r79, 1, -1, %p13;
	add.s32 	%r80, %r51, %r79;
	mul.lo.s32 	%r7, %r80, %r13;
	add.s32 	%r8, %r7, %r3;
	@%p14 bra 	BB1_44;

	cvta.to.global.u64 	%rd50, %rd2;
	mul.wide.s32 	%rd51, %r8, 16;
	add.s64 	%rd52, %rd50, %rd51;
	mov.f32 	%f220, 0f3F800000;
	st.global.v4.f32 	[%rd52], {%f285, %f286, %f287, %f220};
	bra.uni 	BB1_45;

BB1_44:
	cvta.to.global.u64 	%rd53, %rd2;
	// inline asm
	{  cvt.rn.f16.f32 %rs9, %f285;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs10, %f286;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs11, %f287;}

	// inline asm
	mov.f32 	%f224, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs12, %f224;}

	// inline asm
	mul.wide.s32 	%rd54, %r8, 8;
	add.s64 	%rd55, %rd53, %rd54;
	st.global.u16 	[%rd55], %rs9;
	st.global.u16 	[%rd55+2], %rs10;
	st.global.u16 	[%rd55+4], %rs11;
	st.global.u16 	[%rd55+6], %rs12;

BB1_45:
	ld.volatile.shared.f32 	%f225, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f226, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+28];
	mul.ftz.f32 	%f227, %f38, %f226;
	fma.rn.ftz.f32 	%f228, %f2, %f225, %f227;
	ld.volatile.shared.f32 	%f229, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f290, %f5, %f229, %f228;
	@%p9 bra 	BB1_55;

	setp.ltu.ftz.f32	%p28, %f290, 0f00000000;
	@%p28 bra 	BB1_48;
	bra.uni 	BB1_47;

BB1_48:
	neg.ftz.f32 	%f232, %f290;
	lg2.approx.ftz.f32 	%f233, %f232;
	mul.ftz.f32 	%f234, %f233, 0f3ED55555;
	ex2.approx.ftz.f32 	%f235, %f234;
	neg.ftz.f32 	%f290, %f235;
	bra.uni 	BB1_49;

BB1_55:
	ld.volatile.shared.f32 	%f258, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f259, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f260, %f38, %f259;
	fma.rn.ftz.f32 	%f261, %f2, %f258, %f260;
	ld.volatile.shared.f32 	%f262, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f291, %f5, %f262, %f261;
	ld.volatile.shared.f32 	%f263, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f264, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f265, %f38, %f264;
	fma.rn.ftz.f32 	%f266, %f2, %f263, %f265;
	ld.volatile.shared.f32 	%f267, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f292, %f5, %f267, %f266;
	bra.uni 	BB1_56;

BB1_47:
	lg2.approx.ftz.f32 	%f230, %f290;
	mul.ftz.f32 	%f231, %f230, 0f3ED55555;
	ex2.approx.ftz.f32 	%f290, %f231;

BB1_49:
	ld.volatile.shared.f32 	%f236, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f237, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+16];
	mul.ftz.f32 	%f238, %f38, %f237;
	fma.rn.ftz.f32 	%f239, %f2, %f236, %f238;
	ld.volatile.shared.f32 	%f240, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f59, %f5, %f240, %f239;
	setp.ltu.ftz.f32	%p29, %f59, 0f00000000;
	@%p29 bra 	BB1_51;
	bra.uni 	BB1_50;

BB1_51:
	neg.ftz.f32 	%f243, %f59;
	lg2.approx.ftz.f32 	%f244, %f243;
	mul.ftz.f32 	%f245, %f244, 0f3ED55555;
	ex2.approx.ftz.f32 	%f246, %f245;
	neg.ftz.f32 	%f291, %f246;
	bra.uni 	BB1_52;

BB1_50:
	lg2.approx.ftz.f32 	%f241, %f59;
	mul.ftz.f32 	%f242, %f241, 0f3ED55555;
	ex2.approx.ftz.f32 	%f291, %f242;

BB1_52:
	ld.volatile.shared.f32 	%f247, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix];
	ld.volatile.shared.f32 	%f248, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+4];
	mul.ftz.f32 	%f249, %f38, %f248;
	fma.rn.ftz.f32 	%f250, %f2, %f247, %f249;
	ld.volatile.shared.f32 	%f251, [_ZZ56PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f63, %f5, %f251, %f250;
	setp.ltu.ftz.f32	%p30, %f63, 0f00000000;
	@%p30 bra 	BB1_54;
	bra.uni 	BB1_53;

BB1_54:
	neg.ftz.f32 	%f254, %f63;
	lg2.approx.ftz.f32 	%f255, %f254;
	mul.ftz.f32 	%f256, %f255, 0f3ED55555;
	ex2.approx.ftz.f32 	%f257, %f256;
	neg.ftz.f32 	%f292, %f257;
	bra.uni 	BB1_56;

BB1_53:
	lg2.approx.ftz.f32 	%f252, %f63;
	mul.ftz.f32 	%f253, %f252, 0f3ED55555;
	ex2.approx.ftz.f32 	%f292, %f253;

BB1_56:
	add.s32 	%r91, %r3, %r7;
	add.s32 	%r9, %r91, 1;
	@%p14 bra 	BB1_58;

	cvta.to.global.u64 	%rd56, %rd2;
	mul.wide.s32 	%rd57, %r9, 16;
	add.s64 	%rd58, %rd56, %rd57;
	mov.f32 	%f268, 0f3F800000;
	st.global.v4.f32 	[%rd58], {%f290, %f291, %f292, %f268};
	bra.uni 	BB1_59;

BB1_58:
	cvta.to.global.u64 	%rd59, %rd2;
	// inline asm
	{  cvt.rn.f16.f32 %rs13, %f290;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs14, %f291;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs15, %f292;}

	// inline asm
	mov.f32 	%f272, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs16, %f272;}

	// inline asm
	mul.wide.s32 	%rd60, %r9, 8;
	add.s64 	%rd61, %rd59, %rd60;
	st.global.u16 	[%rd61], %rs13;
	st.global.u16 	[%rd61+2], %rs14;
	st.global.u16 	[%rd61+4], %rs15;
	st.global.u16 	[%rd61+6], %rs16;

BB1_59:
	ret;
}

	// .globl	PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel
.visible .entry PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel(
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_0,
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_1,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_2,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_3,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_4,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_5,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_6,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_7,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_8,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_9,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_10,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_11,
	.param .align 16 .b8 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_12[16],
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_13,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_14
)
{
	.reg .pred 	%p<45>;
	.reg .b16 	%rs<17>;
	.reg .f32 	%f<356>;
	.reg .b32 	%r<94>;
	.reg .b64 	%rd<74>;
	// demoted variable
	.shared .align 4 .b8 _ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix[36];

	ld.param.u64 	%rd8, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_0];
	ld.param.u64 	%rd7, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_1];
	ld.param.u32 	%r16, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_2];
	ld.param.u32 	%r17, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_3];
	ld.param.u32 	%r18, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_4];
	ld.param.u32 	%r19, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_6];
	ld.param.u32 	%r20, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_7];
	ld.param.u32 	%r21, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_8];
	ld.param.u32 	%r22, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_9];
	ld.param.u32 	%r23, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_10];
	ld.param.u32 	%r24, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_11];
	ld.param.f32 	%f107, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_12+8];
	ld.param.f32 	%f106, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_12+4];
	ld.param.f32 	%f105, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_12];
	ld.param.u32 	%r25, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_13];
	ld.param.u32 	%r26, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel_param_14];
	cvta.to.global.u64 	%rd1, %rd8;
	mov.u32 	%r27, %ntid.x;
	mov.u32 	%r28, %ctaid.x;
	mov.u32 	%r1, %tid.x;
	mad.lo.s32 	%r2, %r27, %r28, %r1;
	mov.u32 	%r29, %ntid.y;
	mov.u32 	%r30, %ctaid.y;
	mov.u32 	%r31, %tid.y;
	mad.lo.s32 	%r3, %r29, %r30, %r31;
	setp.ne.s32	%p1, %r31, 0;
	setp.gt.u32	%p2, %r1, 2;
	or.pred  	%p3, %p1, %p2;
	@%p3 bra 	BB2_2;

	cvt.s64.s32	%rd9, %r25;
	setp.ne.s32	%p4, %r24, 0;
	mul.lo.s32 	%r32, %r1, 3;
	cvt.s64.s32	%rd10, %r32;
	selp.b64	%rd11, 2, 0, %p4;
	add.s64 	%rd12, %rd9, %rd11;
	add.s64 	%rd13, %rd12, %rd10;
	shl.b64 	%rd14, %rd13, 2;
	add.s64 	%rd15, %rd1, %rd14;
	ld.global.f32 	%f109, [%rd15];
	shl.b32 	%r33, %r32, 2;
	mov.u32 	%r34, _ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix;
	add.s32 	%r35, %r34, %r33;
	st.volatile.shared.f32 	[%r35], %f109;
	add.s32 	%r36, %r25, %r32;
	mul.wide.s32 	%rd16, %r36, 4;
	add.s64 	%rd17, %rd1, %rd16;
	ld.global.f32 	%f110, [%rd17+4];
	st.volatile.shared.f32 	[%r35+4], %f110;
	selp.b64	%rd18, 0, 2, %p4;
	add.s64 	%rd19, %rd9, %rd18;
	add.s64 	%rd20, %rd19, %rd10;
	shl.b64 	%rd21, %rd20, 2;
	add.s64 	%rd22, %rd1, %rd21;
	ld.global.f32 	%f111, [%rd22];
	st.volatile.shared.f32 	[%r35+8], %f111;

BB2_2:
	bar.sync 	0;
	shl.b32 	%r4, %r2, 1;
	setp.ge.s32	%p5, %r4, %r22;
	shl.b32 	%r5, %r3, 1;
	setp.ge.s32	%p6, %r5, %r23;
	or.pred  	%p7, %p5, %p6;
	@%p7 bra 	BB2_79;

	cvt.s64.s32	%rd23, %r16;
	add.s32 	%r37, %r23, -1;
	mul.lo.s32 	%r38, %r37, %r17;
	cvt.s64.s32	%rd24, %r38;
	neg.s32 	%r39, %r17;
	setp.eq.s32	%p8, %r18, 0;
	selp.b32	%r6, %r17, %r39, %p8;
	selp.b64	%rd25, 0, %rd24, %p8;
	add.s64 	%rd2, %rd25, %rd23;
	add.s32 	%r7, %r22, -2;
	add.s32 	%r8, %r23, -2;
	mul.lo.s32 	%r9, %r5, %r6;
	add.s32 	%r40, %r9, %r4;
	cvt.s64.s32	%rd26, %r40;
	add.s64 	%rd27, %rd26, %rd2;
	shl.b64 	%rd28, %rd27, 2;
	add.s64 	%rd29, %rd1, %rd28;
	ld.global.f32 	%f1, [%rd29];
	ld.global.f32 	%f2, [%rd29+4];
	add.s32 	%r41, %r5, 1;
	mad.lo.s32 	%r42, %r41, %r6, %r4;
	cvt.s64.s32	%rd30, %r42;
	add.s64 	%rd31, %rd30, %rd2;
	shl.b64 	%rd32, %rd31, 2;
	add.s64 	%rd3, %rd1, %rd32;
	ld.global.f32 	%f3, [%rd3];
	ld.global.f32 	%f4, [%rd3+4];
	setp.eq.s32	%p9, %r2, 0;
	mov.f32 	%f326, %f4;
	@%p9 bra 	BB2_5;

	ld.global.f32 	%f326, [%rd3+-4];

BB2_5:
	setp.ge.s32	%p10, %r4, %r7;
	mov.f32 	%f327, %f3;
	@%p10 bra 	BB2_7;

	ld.global.f32 	%f327, [%rd3+8];

BB2_7:
	mov.f32 	%f328, %f2;
	@%p9 bra 	BB2_9;

	ld.global.f32 	%f328, [%rd29+-4];

BB2_9:
	mov.f32 	%f329, %f1;
	@%p10 bra 	BB2_11;

	ld.global.f32 	%f329, [%rd29+8];

BB2_11:
	setp.eq.s32	%p14, %r3, 0;
	or.pred  	%p15, %p14, %p9;
	add.s32 	%r44, %r5, -1;
	mad.lo.s32 	%r45, %r44, %r6, %r4;
	add.s32 	%r46, %r45, -1;
	cvt.s64.s32	%rd36, %r46;
	add.s64 	%rd37, %rd36, %rd2;
	shl.b64 	%rd38, %rd37, 2;
	add.s64 	%rd5, %rd1, %rd38;
	mov.f32 	%f330, %f4;
	@%p15 bra 	BB2_13;

	ld.global.f32 	%f330, [%rd5];

BB2_13:
	mov.f32 	%f331, %f3;
	@%p14 bra 	BB2_15;

	cvt.s64.s32	%rd39, %r45;
	add.s64 	%rd40, %rd39, %rd2;
	shl.b64 	%rd41, %rd40, 2;
	add.s64 	%rd42, %rd1, %rd41;
	ld.global.f32 	%f331, [%rd42];

BB2_15:
	mov.f32 	%f332, %f4;
	@%p14 bra 	BB2_17;

	ld.global.f32 	%f332, [%rd5+8];

BB2_17:
	setp.ge.s32	%p18, %r5, %r8;
	mov.f32 	%f333, %f1;
	@%p18 bra 	BB2_19;

	add.s32 	%r49, %r5, 2;
	mad.lo.s32 	%r50, %r49, %r6, %r4;
	cvt.s64.s32	%rd43, %r50;
	add.s64 	%rd44, %rd43, %rd2;
	shl.b64 	%rd45, %rd44, 2;
	add.s64 	%rd46, %rd1, %rd45;
	ld.global.f32 	%f333, [%rd46];

BB2_19:
	add.s32 	%r51, %r5, 2;
	mad.lo.s32 	%r52, %r51, %r6, %r4;
	add.s32 	%r53, %r52, 1;
	cvt.s64.s32	%rd47, %r53;
	add.s64 	%rd48, %rd47, %rd2;
	shl.b64 	%rd49, %rd48, 2;
	add.s64 	%rd6, %rd1, %rd49;
	mov.f32 	%f334, %f2;
	@%p18 bra 	BB2_21;

	ld.global.f32 	%f334, [%rd6];

BB2_21:
	or.pred  	%p22, %p18, %p10;
	mov.f32 	%f335, %f1;
	@%p22 bra 	BB2_23;

	ld.global.f32 	%f335, [%rd6+4];

BB2_23:
	add.ftz.f32 	%f112, %f330, %f332;
	add.ftz.f32 	%f113, %f326, %f112;
	add.ftz.f32 	%f114, %f4, %f113;
	mul.ftz.f32 	%f115, %f114, 0f3E800000;
	add.ftz.f32 	%f116, %f2, %f328;
	add.ftz.f32 	%f117, %f116, %f331;
	add.ftz.f32 	%f118, %f3, %f117;
	mul.ftz.f32 	%f119, %f118, 0f3E800000;
	min.ftz.f32 	%f26, %f1, %f105;
	min.ftz.f32 	%f28, %f119, %f106;
	min.ftz.f32 	%f30, %f115, %f107;
	ld.volatile.shared.f32 	%f120, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f121, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+28];
	mul.ftz.f32 	%f122, %f28, %f121;
	fma.rn.ftz.f32 	%f123, %f26, %f120, %f122;
	ld.volatile.shared.f32 	%f124, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f338, %f30, %f124, %f123;
	setp.eq.s32	%p23, %r26, 0;
	@%p23 bra 	BB2_33;

	setp.ltu.ftz.f32	%p24, %f338, 0f00000000;
	@%p24 bra 	BB2_26;
	bra.uni 	BB2_25;

BB2_26:
	neg.ftz.f32 	%f127, %f338;
	lg2.approx.ftz.f32 	%f128, %f127;
	mul.ftz.f32 	%f129, %f128, 0f3ED55555;
	ex2.approx.ftz.f32 	%f130, %f129;
	neg.ftz.f32 	%f338, %f130;
	bra.uni 	BB2_27;

BB2_33:
	ld.volatile.shared.f32 	%f153, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f154, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f155, %f28, %f154;
	fma.rn.ftz.f32 	%f156, %f26, %f153, %f155;
	ld.volatile.shared.f32 	%f157, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f339, %f30, %f157, %f156;
	ld.volatile.shared.f32 	%f158, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f159, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f160, %f28, %f159;
	fma.rn.ftz.f32 	%f161, %f26, %f158, %f160;
	ld.volatile.shared.f32 	%f162, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f340, %f30, %f162, %f161;
	bra.uni 	BB2_34;

BB2_25:
	lg2.approx.ftz.f32 	%f125, %f338;
	mul.ftz.f32 	%f126, %f125, 0f3ED55555;
	ex2.approx.ftz.f32 	%f338, %f126;

BB2_27:
	ld.volatile.shared.f32 	%f131, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f132, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f133, %f28, %f132;
	fma.rn.ftz.f32 	%f134, %f26, %f131, %f133;
	ld.volatile.shared.f32 	%f135, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f35, %f30, %f135, %f134;
	setp.ltu.ftz.f32	%p25, %f35, 0f00000000;
	@%p25 bra 	BB2_29;
	bra.uni 	BB2_28;

BB2_29:
	neg.ftz.f32 	%f138, %f35;
	lg2.approx.ftz.f32 	%f139, %f138;
	mul.ftz.f32 	%f140, %f139, 0f3ED55555;
	ex2.approx.ftz.f32 	%f141, %f140;
	neg.ftz.f32 	%f339, %f141;
	bra.uni 	BB2_30;

BB2_28:
	lg2.approx.ftz.f32 	%f136, %f35;
	mul.ftz.f32 	%f137, %f136, 0f3ED55555;
	ex2.approx.ftz.f32 	%f339, %f137;

BB2_30:
	ld.volatile.shared.f32 	%f142, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f143, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f144, %f28, %f143;
	fma.rn.ftz.f32 	%f145, %f26, %f142, %f144;
	ld.volatile.shared.f32 	%f146, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f39, %f30, %f146, %f145;
	setp.ltu.ftz.f32	%p26, %f39, 0f00000000;
	@%p26 bra 	BB2_32;
	bra.uni 	BB2_31;

BB2_32:
	neg.ftz.f32 	%f149, %f39;
	lg2.approx.ftz.f32 	%f150, %f149;
	mul.ftz.f32 	%f151, %f150, 0f3ED55555;
	ex2.approx.ftz.f32 	%f152, %f151;
	neg.ftz.f32 	%f340, %f152;
	bra.uni 	BB2_34;

BB2_31:
	lg2.approx.ftz.f32 	%f147, %f39;
	mul.ftz.f32 	%f148, %f147, 0f3ED55555;
	ex2.approx.ftz.f32 	%f340, %f148;

BB2_34:
	// Store the first output pixel {%f338, %f339, %f340, 1.0}.
	// Row selection: %r61 = (%r20 == 0) ? %r5 : (%r37 - %r5); the pixel index
	// is %r11 = %r61 * %r19 + %r4.
	// NOTE(review): %r4, %r5, %r19, %r20, %r21, %r37 and %rd7 are defined
	// earlier in this kernel, outside this excerpt. Presumably x, y, output
	// pitch, flip flag, 32f/16f flag, last-row index and destination pointer
	// -- confirm against the kernel prologue.
	// %p27, %p28, %r10 and %r61 are reused by later blocks of this kernel.
	sub.s32 	%r60, %r37, %r5;
	setp.eq.s32	%p27, %r20, 0;
	selp.b32	%r61, %r5, %r60, %p27;
	mul.lo.s32 	%r10, %r61, %r19;
	add.s32 	%r11, %r10, %r4;
	// %r21 == 0 selects the half-precision store path at BB2_36.
	setp.eq.s32	%p28, %r21, 0;
	@%p28 bra 	BB2_36;

	// 32-bit float path: 16 bytes per pixel, written as one v4.f32 store.
	// 0f3F800000 is 1.0f and fills the fourth component.
	cvta.to.global.u64 	%rd50, %rd7;
	mul.wide.s32 	%rd51, %r11, 16;
	add.s64 	%rd52, %rd50, %rd51;
	mov.f32 	%f163, 0f3F800000;
	st.global.v4.f32 	[%rd52], {%f338, %f339, %f340, %f163};
	bra.uni 	BB2_37;

BB2_36:
	// 16-bit float path: each component is rounded to nearest-even f16 and
	// the pixel occupies 8 bytes, written as four 2-byte stores.
	cvta.to.global.u64 	%rd53, %rd7;
	// inline asm
	{  cvt.rn.f16.f32 %rs1, %f338;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs2, %f339;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs3, %f340;}

	// inline asm
	mov.f32 	%f167, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs4, %f167;}

	// inline asm
	// Byte offset = pixel index * 8; components land at +0, +2, +4, +6.
	mul.wide.s32 	%rd54, %r11, 8;
	add.s64 	%rd55, %rd53, %rd54;
	st.global.u16 	[%rd55], %rs1;
	st.global.u16 	[%rd55+2], %rs2;
	st.global.u16 	[%rd55+4], %rs3;
	st.global.u16 	[%rd55+6], %rs4;

BB2_37:
	add.ftz.f32 	%f168, %f4, %f332;
	mul.ftz.f32 	%f169, %f168, 0f3F000000;
	add.ftz.f32 	%f47, %f1, %f329;
	mul.ftz.f32 	%f170, %f47, 0f3F000000;
	min.ftz.f32 	%f48, %f170, %f105;
	min.ftz.f32 	%f49, %f169, %f107;
	ld.volatile.shared.f32 	%f171, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f172, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+28];
	min.ftz.f32 	%f50, %f2, %f106;
	mul.ftz.f32 	%f173, %f50, %f172;
	fma.rn.ftz.f32 	%f174, %f48, %f171, %f173;
	ld.volatile.shared.f32 	%f175, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f343, %f49, %f175, %f174;
	@%p23 bra 	BB2_47;

	setp.ltu.ftz.f32	%p30, %f343, 0f00000000;
	@%p30 bra 	BB2_40;
	bra.uni 	BB2_39;

BB2_40:
	neg.ftz.f32 	%f178, %f343;
	lg2.approx.ftz.f32 	%f179, %f178;
	mul.ftz.f32 	%f180, %f179, 0f3ED55555;
	ex2.approx.ftz.f32 	%f181, %f180;
	neg.ftz.f32 	%f343, %f181;
	bra.uni 	BB2_41;

BB2_47:
	ld.volatile.shared.f32 	%f204, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f205, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f206, %f50, %f205;
	fma.rn.ftz.f32 	%f207, %f48, %f204, %f206;
	ld.volatile.shared.f32 	%f208, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f344, %f49, %f208, %f207;
	ld.volatile.shared.f32 	%f209, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f210, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f211, %f50, %f210;
	fma.rn.ftz.f32 	%f212, %f48, %f209, %f211;
	ld.volatile.shared.f32 	%f213, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f345, %f49, %f213, %f212;
	bra.uni 	BB2_48;

BB2_39:
	lg2.approx.ftz.f32 	%f176, %f343;
	mul.ftz.f32 	%f177, %f176, 0f3ED55555;
	ex2.approx.ftz.f32 	%f343, %f177;

BB2_41:
	ld.volatile.shared.f32 	%f182, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f183, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f184, %f50, %f183;
	fma.rn.ftz.f32 	%f185, %f48, %f182, %f184;
	ld.volatile.shared.f32 	%f186, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f55, %f49, %f186, %f185;
	setp.ltu.ftz.f32	%p31, %f55, 0f00000000;
	@%p31 bra 	BB2_43;
	bra.uni 	BB2_42;

BB2_43:
	neg.ftz.f32 	%f189, %f55;
	lg2.approx.ftz.f32 	%f190, %f189;
	mul.ftz.f32 	%f191, %f190, 0f3ED55555;
	ex2.approx.ftz.f32 	%f192, %f191;
	neg.ftz.f32 	%f344, %f192;
	bra.uni 	BB2_44;

BB2_42:
	lg2.approx.ftz.f32 	%f187, %f55;
	mul.ftz.f32 	%f188, %f187, 0f3ED55555;
	ex2.approx.ftz.f32 	%f344, %f188;

BB2_44:
	ld.volatile.shared.f32 	%f193, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f194, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f195, %f50, %f194;
	fma.rn.ftz.f32 	%f196, %f48, %f193, %f195;
	ld.volatile.shared.f32 	%f197, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f59, %f49, %f197, %f196;
	setp.ltu.ftz.f32	%p32, %f59, 0f00000000;
	@%p32 bra 	BB2_46;
	bra.uni 	BB2_45;

BB2_46:
	neg.ftz.f32 	%f200, %f59;
	lg2.approx.ftz.f32 	%f201, %f200;
	mul.ftz.f32 	%f202, %f201, 0f3ED55555;
	ex2.approx.ftz.f32 	%f203, %f202;
	neg.ftz.f32 	%f345, %f203;
	bra.uni 	BB2_48;

BB2_45:
	lg2.approx.ftz.f32 	%f198, %f59;
	mul.ftz.f32 	%f199, %f198, 0f3ED55555;
	ex2.approx.ftz.f32 	%f345, %f199;

BB2_48:
	add.s32 	%r72, %r4, %r10;
	add.s32 	%r12, %r72, 1;
	@%p28 bra 	BB2_50;

	cvta.to.global.u64 	%rd56, %rd7;
	mul.wide.s32 	%rd57, %r12, 16;
	add.s64 	%rd58, %rd56, %rd57;
	mov.f32 	%f214, 0f3F800000;
	st.global.v4.f32 	[%rd58], {%f343, %f344, %f345, %f214};
	bra.uni 	BB2_51;

BB2_50:
	cvta.to.global.u64 	%rd59, %rd7;
	// inline asm
	{  cvt.rn.f16.f32 %rs5, %f343;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs6, %f344;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs7, %f345;}

	// inline asm
	mov.f32 	%f218, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs8, %f218;}

	// inline asm
	mul.wide.s32 	%rd60, %r12, 8;
	add.s64 	%rd61, %rd59, %rd60;
	st.global.u16 	[%rd61], %rs5;
	st.global.u16 	[%rd61+2], %rs6;
	st.global.u16 	[%rd61+4], %rs7;
	st.global.u16 	[%rd61+6], %rs8;

BB2_51:
	add.ftz.f32 	%f219, %f4, %f326;
	mul.ftz.f32 	%f220, %f219, 0f3F000000;
	add.ftz.f32 	%f221, %f1, %f333;
	mul.ftz.f32 	%f222, %f221, 0f3F000000;
	min.ftz.f32 	%f67, %f222, %f105;
	min.ftz.f32 	%f68, %f220, %f107;
	ld.volatile.shared.f32 	%f223, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f224, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+28];
	min.ftz.f32 	%f69, %f3, %f106;
	mul.ftz.f32 	%f225, %f69, %f224;
	fma.rn.ftz.f32 	%f226, %f67, %f223, %f225;
	ld.volatile.shared.f32 	%f227, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f348, %f68, %f227, %f226;
	@%p23 bra 	BB2_61;

	setp.ltu.ftz.f32	%p35, %f348, 0f00000000;
	@%p35 bra 	BB2_54;
	bra.uni 	BB2_53;

BB2_54:
	neg.ftz.f32 	%f230, %f348;
	lg2.approx.ftz.f32 	%f231, %f230;
	mul.ftz.f32 	%f232, %f231, 0f3ED55555;
	ex2.approx.ftz.f32 	%f233, %f232;
	neg.ftz.f32 	%f348, %f233;
	bra.uni 	BB2_55;

BB2_61:
	ld.volatile.shared.f32 	%f256, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f257, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f258, %f69, %f257;
	fma.rn.ftz.f32 	%f259, %f67, %f256, %f258;
	ld.volatile.shared.f32 	%f260, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f349, %f68, %f260, %f259;
	ld.volatile.shared.f32 	%f261, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f262, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f263, %f69, %f262;
	fma.rn.ftz.f32 	%f264, %f67, %f261, %f263;
	ld.volatile.shared.f32 	%f265, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f350, %f68, %f265, %f264;
	bra.uni 	BB2_62;

BB2_53:
	lg2.approx.ftz.f32 	%f228, %f348;
	mul.ftz.f32 	%f229, %f228, 0f3ED55555;
	ex2.approx.ftz.f32 	%f348, %f229;

BB2_55:
	ld.volatile.shared.f32 	%f234, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f235, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f236, %f69, %f235;
	fma.rn.ftz.f32 	%f237, %f67, %f234, %f236;
	ld.volatile.shared.f32 	%f238, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f74, %f68, %f238, %f237;
	setp.ltu.ftz.f32	%p36, %f74, 0f00000000;
	@%p36 bra 	BB2_57;
	bra.uni 	BB2_56;

BB2_57:
	neg.ftz.f32 	%f241, %f74;
	lg2.approx.ftz.f32 	%f242, %f241;
	mul.ftz.f32 	%f243, %f242, 0f3ED55555;
	ex2.approx.ftz.f32 	%f244, %f243;
	neg.ftz.f32 	%f349, %f244;
	bra.uni 	BB2_58;

BB2_56:
	lg2.approx.ftz.f32 	%f239, %f74;
	mul.ftz.f32 	%f240, %f239, 0f3ED55555;
	ex2.approx.ftz.f32 	%f349, %f240;

BB2_58:
	ld.volatile.shared.f32 	%f245, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f246, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f247, %f69, %f246;
	fma.rn.ftz.f32 	%f248, %f67, %f245, %f247;
	ld.volatile.shared.f32 	%f249, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f78, %f68, %f249, %f248;
	setp.ltu.ftz.f32	%p37, %f78, 0f00000000;
	@%p37 bra 	BB2_60;
	bra.uni 	BB2_59;

BB2_60:
	neg.ftz.f32 	%f252, %f78;
	lg2.approx.ftz.f32 	%f253, %f252;
	mul.ftz.f32 	%f254, %f253, 0f3ED55555;
	ex2.approx.ftz.f32 	%f255, %f254;
	neg.ftz.f32 	%f350, %f255;
	bra.uni 	BB2_62;

BB2_59:
	lg2.approx.ftz.f32 	%f250, %f78;
	mul.ftz.f32 	%f251, %f250, 0f3ED55555;
	ex2.approx.ftz.f32 	%f350, %f251;

BB2_62:
	selp.b32	%r81, 1, -1, %p27;
	add.s32 	%r82, %r61, %r81;
	mul.lo.s32 	%r13, %r82, %r19;
	add.s32 	%r14, %r13, %r4;
	@%p28 bra 	BB2_64;

	cvta.to.global.u64 	%rd62, %rd7;
	mul.wide.s32 	%rd63, %r14, 16;
	add.s64 	%rd64, %rd62, %rd63;
	mov.f32 	%f266, 0f3F800000;
	st.global.v4.f32 	[%rd64], {%f348, %f349, %f350, %f266};
	bra.uni 	BB2_65;

BB2_64:
	cvta.to.global.u64 	%rd65, %rd7;
	// inline asm
	{  cvt.rn.f16.f32 %rs9, %f348;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs10, %f349;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs11, %f350;}

	// inline asm
	mov.f32 	%f270, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs12, %f270;}

	// inline asm
	mul.wide.s32 	%rd66, %r14, 8;
	add.s64 	%rd67, %rd65, %rd66;
	st.global.u16 	[%rd67], %rs9;
	st.global.u16 	[%rd67+2], %rs10;
	st.global.u16 	[%rd67+4], %rs11;
	st.global.u16 	[%rd67+6], %rs12;

BB2_65:
	add.ftz.f32 	%f271, %f2, %f3;
	add.ftz.f32 	%f272, %f271, %f327;
	add.ftz.f32 	%f273, %f272, %f334;
	mul.ftz.f32 	%f274, %f273, 0f3E800000;
	add.ftz.f32 	%f275, %f47, %f333;
	add.ftz.f32 	%f276, %f275, %f335;
	mul.ftz.f32 	%f277, %f276, 0f3E800000;
	min.ftz.f32 	%f86, %f277, %f105;
	min.ftz.f32 	%f87, %f274, %f106;
	ld.volatile.shared.f32 	%f278, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f279, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+28];
	mul.ftz.f32 	%f280, %f87, %f279;
	fma.rn.ftz.f32 	%f281, %f86, %f278, %f280;
	ld.volatile.shared.f32 	%f282, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+32];
	min.ftz.f32 	%f88, %f4, %f107;
	fma.rn.ftz.f32 	%f353, %f88, %f282, %f281;
	@%p23 bra 	BB2_75;

	setp.ltu.ftz.f32	%p41, %f353, 0f00000000;
	@%p41 bra 	BB2_68;
	bra.uni 	BB2_67;

BB2_68:
	neg.ftz.f32 	%f285, %f353;
	lg2.approx.ftz.f32 	%f286, %f285;
	mul.ftz.f32 	%f287, %f286, 0f3ED55555;
	ex2.approx.ftz.f32 	%f288, %f287;
	neg.ftz.f32 	%f353, %f288;
	bra.uni 	BB2_69;

BB2_75:
	ld.volatile.shared.f32 	%f311, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f312, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f313, %f87, %f312;
	fma.rn.ftz.f32 	%f314, %f86, %f311, %f313;
	ld.volatile.shared.f32 	%f315, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f354, %f88, %f315, %f314;
	ld.volatile.shared.f32 	%f316, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f317, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f318, %f87, %f317;
	fma.rn.ftz.f32 	%f319, %f86, %f316, %f318;
	ld.volatile.shared.f32 	%f320, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f355, %f88, %f320, %f319;
	bra.uni 	BB2_76;

BB2_67:
	lg2.approx.ftz.f32 	%f283, %f353;
	mul.ftz.f32 	%f284, %f283, 0f3ED55555;
	ex2.approx.ftz.f32 	%f353, %f284;

BB2_69:
	ld.volatile.shared.f32 	%f289, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f290, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+16];
	mul.ftz.f32 	%f291, %f87, %f290;
	fma.rn.ftz.f32 	%f292, %f86, %f289, %f291;
	ld.volatile.shared.f32 	%f293, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f93, %f88, %f293, %f292;
	setp.ltu.ftz.f32	%p42, %f93, 0f00000000;
	@%p42 bra 	BB2_71;
	bra.uni 	BB2_70;

BB2_71:
	neg.ftz.f32 	%f296, %f93;
	lg2.approx.ftz.f32 	%f297, %f296;
	mul.ftz.f32 	%f298, %f297, 0f3ED55555;
	ex2.approx.ftz.f32 	%f299, %f298;
	neg.ftz.f32 	%f354, %f299;
	bra.uni 	BB2_72;

BB2_70:
	lg2.approx.ftz.f32 	%f294, %f93;
	mul.ftz.f32 	%f295, %f294, 0f3ED55555;
	ex2.approx.ftz.f32 	%f354, %f295;

BB2_72:
	ld.volatile.shared.f32 	%f300, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix];
	ld.volatile.shared.f32 	%f301, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+4];
	mul.ftz.f32 	%f302, %f87, %f301;
	fma.rn.ftz.f32 	%f303, %f86, %f300, %f302;
	ld.volatile.shared.f32 	%f304, [_ZZ55PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f97, %f88, %f304, %f303;
	setp.ltu.ftz.f32	%p43, %f97, 0f00000000;
	@%p43 bra 	BB2_74;
	bra.uni 	BB2_73;

BB2_74:
	neg.ftz.f32 	%f307, %f97;
	lg2.approx.ftz.f32 	%f308, %f307;
	mul.ftz.f32 	%f309, %f308, 0f3ED55555;
	ex2.approx.ftz.f32 	%f310, %f309;
	neg.ftz.f32 	%f355, %f310;
	bra.uni 	BB2_76;

BB2_73:
	lg2.approx.ftz.f32 	%f305, %f97;
	mul.ftz.f32 	%f306, %f305, 0f3ED55555;
	ex2.approx.ftz.f32 	%f355, %f306;

BB2_76:
	add.s32 	%r93, %r4, %r13;
	add.s32 	%r15, %r93, 1;
	@%p28 bra 	BB2_78;

	cvta.to.global.u64 	%rd68, %rd7;
	mul.wide.s32 	%rd69, %r15, 16;
	add.s64 	%rd70, %rd68, %rd69;
	mov.f32 	%f321, 0f3F800000;
	st.global.v4.f32 	[%rd70], {%f353, %f354, %f355, %f321};
	bra.uni 	BB2_79;

BB2_78:
	cvta.to.global.u64 	%rd71, %rd7;
	// inline asm
	{  cvt.rn.f16.f32 %rs13, %f353;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs14, %f354;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs15, %f355;}

	// inline asm
	mov.f32 	%f325, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs16, %f325;}

	// inline asm
	mul.wide.s32 	%rd72, %r15, 8;
	add.s64 	%rd73, %rd71, %rd72;
	st.global.u16 	[%rd73], %rs13;
	st.global.u16 	[%rd73+2], %rs14;
	st.global.u16 	[%rd73+4], %rs15;
	st.global.u16 	[%rd73+6], %rs16;

BB2_79:
	ret;
}

	// .globl	PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel
// Kernel entry. Each thread handles one 2x2 cell of the input: it derives a
// global (x, y) thread index, doubles both coordinates, and leaves early when
// the cell's top-left sample lies outside the param_8 x param_9 extent.
//
// Parameters as used by the portion of the kernel visible in this file chunk:
//   param_0  u64  source pointer (converted to a global address, read as f32)
//   param_1  u64  destination pointer (used by the output stores)
//   param_2  u32  element offset added to every source index
//   param_3  u32  source row pitch in f32 elements
//   param_4  u32  0 = walk rows with +pitch from row 0; non-zero = walk with
//                 -pitch starting at row (param_9 - 1)
//   param_6  u32  destination row pitch in pixels
//   param_7  u32  non-zero = 4 x f32 output pixels, 0 = 4 x f16 output pixels
//   param_8  u32  extent compared against 2 * x (width bound)
//   param_9  u32  extent compared against 2 * y (height bound)
// param_5, param_10 and param_11 are not loaded in the portion shown here.
.visible .entry PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel(
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_0,
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_1,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_2,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_3,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_4,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_5,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_6,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_7,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_8,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_9,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_10,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_11
)
{
	// Virtual register pools declared for this kernel.
	.reg .pred 	%p<61>;
	.reg .b16 	%rs<17>;
	.reg .f32 	%f<302>;
	.reg .b32 	%r<337>;
	.reg .b64 	%rd<152>;


	// Fetch the kernel arguments that the body uses.
	ld.param.u64 	%rd5, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_0];
	ld.param.u64 	%rd6, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_1];
	ld.param.u32 	%r11, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_2];
	ld.param.u32 	%r12, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_3];
	ld.param.u32 	%r13, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_4];
	ld.param.u32 	%r14, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_6];
	ld.param.u32 	%r15, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_7];
	ld.param.u32 	%r16, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_8];
	ld.param.u32 	%r17, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel_param_9];
	cvta.to.global.u64 	%rd1, %rd5;
	// %r21 = ntid.x * ctaid.x + tid.x  (global thread x)
	mov.u32 	%r18, %ntid.x;
	mov.u32 	%r19, %ctaid.x;
	mov.u32 	%r20, %tid.x;
	mad.lo.s32 	%r21, %r18, %r19, %r20;
	// %r25 = ntid.y * ctaid.y + tid.y  (global thread y)
	mov.u32 	%r22, %ntid.y;
	mov.u32 	%r23, %ctaid.y;
	mov.u32 	%r24, %tid.y;
	mad.lo.s32 	%r25, %r22, %r23, %r24;
	// %r1 = 2 * x and %r2 = 2 * y: top-left sample of this thread's 2x2 cell.
	shl.b32 	%r1, %r21, 1;
	shl.b32 	%r2, %r25, 1;
	// Skip the thread when either doubled coordinate reaches its bound.
	// NOTE(review): BB3_81 lies beyond this excerpt; presumably the kernel exit.
	setp.ge.s32	%p1, %r1, %r16;
	setp.ge.s32	%p2, %r2, %r17;
	or.pred  	%p3, %p1, %p2;
	@%p3 bra 	BB3_81;

	// Source addressing set-up.
	//   %r3  = row stride in elements: +%r12 when %r13 == 0, otherwise -%r12
	//   %rd2 = constant element offset: %r11, plus (%r17 - 1) * %r12 when the
	//          stride is negative (i.e. start from the last row and walk back)
	// Both are reused by every later neighbour load in this kernel.
	cvt.s64.s32	%rd7, %r11;
	add.s32 	%r26, %r17, -1;
	mul.lo.s32 	%r27, %r26, %r12;
	cvt.s64.s32	%rd8, %r27;
	neg.s32 	%r28, %r12;
	setp.eq.s32	%p4, %r13, 0;
	selp.b32	%r3, %r12, %r28, %p4;
	selp.b64	%rd9, 0, %rd8, %p4;
	add.s64 	%rd2, %rd9, %rd7;
	// %rd13 = address of the sample at column %r1, row %r2 (4 bytes per sample).
	mul.lo.s32 	%r4, %r2, %r3;
	add.s32 	%r29, %r4, %r1;
	cvt.s64.s32	%rd10, %r29;
	add.s64 	%rd11, %rd10, %rd2;
	shl.b64 	%rd12, %rd11, 2;
	add.s64 	%rd13, %rd1, %rd12;
	ld.global.f32 	%f1, [%rd13];
	// Sign-preserving power: %f284 = sign(%f1) * |%f1| ^ 0.41666666,
	// evaluated as ex2(lg2(|v|) * 0f3ED55555). 0f3ED55555 is ~0.41666666,
	// i.e. approximately 1/2.4.
	// setp.ltu is "less than or unordered", so a NaN input also takes the
	// negated branch (BB3_3).
	setp.ltu.ftz.f32	%p5, %f1, 0f00000000;
	@%p5 bra 	BB3_3;
	bra.uni 	BB3_2;

BB3_3:
	// Negative (or NaN) input: apply the power to -v, then negate the result.
	neg.ftz.f32 	%f83, %f1;
	lg2.approx.ftz.f32 	%f84, %f83;
	mul.ftz.f32 	%f85, %f84, 0f3ED55555;
	ex2.approx.ftz.f32 	%f86, %f85;
	neg.ftz.f32 	%f284, %f86;
	bra.uni 	BB3_4;

BB3_2:
	// Non-negative input: apply the power directly.
	lg2.approx.ftz.f32 	%f81, %f1;
	mul.ftz.f32 	%f82, %f81, 0f3ED55555;
	ex2.approx.ftz.f32 	%f284, %f82;

BB3_4:
	ld.global.f32 	%f5, [%rd13+4];
	setp.ltu.ftz.f32	%p6, %f5, 0f00000000;
	@%p6 bra 	BB3_6;
	bra.uni 	BB3_5;

BB3_6:
	neg.ftz.f32 	%f89, %f5;
	lg2.approx.ftz.f32 	%f90, %f89;
	mul.ftz.f32 	%f91, %f90, 0f3ED55555;
	ex2.approx.ftz.f32 	%f92, %f91;
	neg.ftz.f32 	%f285, %f92;
	bra.uni 	BB3_7;

BB3_5:
	lg2.approx.ftz.f32 	%f87, %f5;
	mul.ftz.f32 	%f88, %f87, 0f3ED55555;
	ex2.approx.ftz.f32 	%f285, %f88;

BB3_7:
	add.s32 	%r31, %r2, 1;
	mad.lo.s32 	%r32, %r31, %r3, %r1;
	cvt.s64.s32	%rd17, %r32;
	add.s64 	%rd18, %rd17, %rd2;
	shl.b64 	%rd19, %rd18, 2;
	add.s64 	%rd20, %rd1, %rd19;
	ld.global.f32 	%f9, [%rd20];
	setp.ltu.ftz.f32	%p7, %f9, 0f00000000;
	@%p7 bra 	BB3_9;
	bra.uni 	BB3_8;

BB3_9:
	neg.ftz.f32 	%f95, %f9;
	lg2.approx.ftz.f32 	%f96, %f95;
	mul.ftz.f32 	%f97, %f96, 0f3ED55555;
	ex2.approx.ftz.f32 	%f98, %f97;
	neg.ftz.f32 	%f286, %f98;
	bra.uni 	BB3_10;

BB3_8:
	lg2.approx.ftz.f32 	%f93, %f9;
	mul.ftz.f32 	%f94, %f93, 0f3ED55555;
	ex2.approx.ftz.f32 	%f286, %f94;

BB3_10:
	ld.global.f32 	%f13, [%rd20+4];
	setp.ltu.ftz.f32	%p9, %f13, 0f00000000;
	@%p9 bra 	BB3_12;
	bra.uni 	BB3_11;

BB3_12:
	neg.ftz.f32 	%f101, %f13;
	lg2.approx.ftz.f32 	%f102, %f101;
	mul.ftz.f32 	%f103, %f102, 0f3ED55555;
	ex2.approx.ftz.f32 	%f104, %f103;
	neg.ftz.f32 	%f287, %f104;
	bra.uni 	BB3_13;

BB3_11:
	lg2.approx.ftz.f32 	%f99, %f13;
	mul.ftz.f32 	%f100, %f99, 0f3ED55555;
	ex2.approx.ftz.f32 	%f287, %f100;

BB3_13:
	setp.lt.s32	%p10, %r21, 1;
	mov.f32 	%f288, %f287;
	@%p10 bra 	BB3_17;

	ld.global.f32 	%f17, [%rd20+-4];
	setp.ltu.ftz.f32	%p12, %f17, 0f00000000;
	@%p12 bra 	BB3_16;
	bra.uni 	BB3_15;

BB3_16:
	neg.ftz.f32 	%f107, %f17;
	lg2.approx.ftz.f32 	%f108, %f107;
	mul.ftz.f32 	%f109, %f108, 0f3ED55555;
	ex2.approx.ftz.f32 	%f110, %f109;
	neg.ftz.f32 	%f288, %f110;
	bra.uni 	BB3_17;

BB3_15:
	lg2.approx.ftz.f32 	%f105, %f17;
	mul.ftz.f32 	%f106, %f105, 0f3ED55555;
	ex2.approx.ftz.f32 	%f288, %f106;

BB3_17:
	add.s32 	%r74, %r16, -2;
	setp.ge.s32	%p13, %r1, %r74;
	mov.f32 	%f289, %f286;
	@%p13 bra 	BB3_21;

	ld.global.f32 	%f21, [%rd20+8];
	setp.ltu.ftz.f32	%p15, %f21, 0f00000000;
	@%p15 bra 	BB3_20;
	bra.uni 	BB3_19;

BB3_20:
	neg.ftz.f32 	%f113, %f21;
	lg2.approx.ftz.f32 	%f114, %f113;
	mul.ftz.f32 	%f115, %f114, 0f3ED55555;
	ex2.approx.ftz.f32 	%f116, %f115;
	neg.ftz.f32 	%f289, %f116;
	bra.uni 	BB3_21;

BB3_19:
	lg2.approx.ftz.f32 	%f111, %f21;
	mul.ftz.f32 	%f112, %f111, 0f3ED55555;
	ex2.approx.ftz.f32 	%f289, %f112;

BB3_21:
	add.s32 	%r96, %r16, -3;
	setp.ge.s32	%p16, %r1, %r96;
	mov.f32 	%f290, %f287;
	@%p16 bra 	BB3_25;

	ld.global.f32 	%f25, [%rd20+12];
	setp.ltu.ftz.f32	%p18, %f25, 0f00000000;
	@%p18 bra 	BB3_24;
	bra.uni 	BB3_23;

BB3_24:
	neg.ftz.f32 	%f119, %f25;
	lg2.approx.ftz.f32 	%f120, %f119;
	mul.ftz.f32 	%f121, %f120, 0f3ED55555;
	ex2.approx.ftz.f32 	%f122, %f121;
	neg.ftz.f32 	%f290, %f122;
	bra.uni 	BB3_25;

BB3_23:
	lg2.approx.ftz.f32 	%f117, %f25;
	mul.ftz.f32 	%f118, %f117, 0f3ED55555;
	ex2.approx.ftz.f32 	%f290, %f118;

BB3_25:
	setp.lt.s32	%p19, %r1, 2;
	mov.f32 	%f291, %f284;
	@%p19 bra 	BB3_29;

	ld.global.f32 	%f29, [%rd13+-8];
	setp.ltu.ftz.f32	%p20, %f29, 0f00000000;
	@%p20 bra 	BB3_28;
	bra.uni 	BB3_27;

BB3_28:
	neg.ftz.f32 	%f125, %f29;
	lg2.approx.ftz.f32 	%f126, %f125;
	mul.ftz.f32 	%f127, %f126, 0f3ED55555;
	ex2.approx.ftz.f32 	%f128, %f127;
	neg.ftz.f32 	%f291, %f128;
	bra.uni 	BB3_29;

BB3_27:
	lg2.approx.ftz.f32 	%f123, %f29;
	mul.ftz.f32 	%f124, %f123, 0f3ED55555;
	ex2.approx.ftz.f32 	%f291, %f124;

BB3_29:
	mov.f32 	%f292, %f285;
	@%p10 bra 	BB3_33;

	ld.global.f32 	%f33, [%rd13+-4];
	setp.ltu.ftz.f32	%p22, %f33, 0f00000000;
	@%p22 bra 	BB3_32;
	bra.uni 	BB3_31;

BB3_32:
	neg.ftz.f32 	%f131, %f33;
	lg2.approx.ftz.f32 	%f132, %f131;
	mul.ftz.f32 	%f133, %f132, 0f3ED55555;
	ex2.approx.ftz.f32 	%f134, %f133;
	neg.ftz.f32 	%f292, %f134;
	bra.uni 	BB3_33;

BB3_31:
	lg2.approx.ftz.f32 	%f129, %f33;
	mul.ftz.f32 	%f130, %f129, 0f3ED55555;
	ex2.approx.ftz.f32 	%f292, %f130;

BB3_33:
	mov.f32 	%f293, %f284;
	@%p13 bra 	BB3_37;

	ld.global.f32 	%f37, [%rd13+8];
	setp.ltu.ftz.f32	%p24, %f37, 0f00000000;
	@%p24 bra 	BB3_36;
	bra.uni 	BB3_35;

BB3_36:
	neg.ftz.f32 	%f137, %f37;
	lg2.approx.ftz.f32 	%f138, %f137;
	mul.ftz.f32 	%f139, %f138, 0f3ED55555;
	ex2.approx.ftz.f32 	%f140, %f139;
	neg.ftz.f32 	%f293, %f140;
	bra.uni 	BB3_37;

BB3_35:
	lg2.approx.ftz.f32 	%f135, %f37;
	mul.ftz.f32 	%f136, %f135, 0f3ED55555;
	ex2.approx.ftz.f32 	%f293, %f136;

BB3_37:
	setp.lt.s32	%p25, %r25, 1;
	or.pred  	%p27, %p25, %p10;
	add.s32 	%r137, %r2, -1;
	mad.lo.s32 	%r141, %r137, %r3, %r1;
	add.s32 	%r142, %r141, -1;
	cvt.s64.s32	%rd57, %r142;
	add.s64 	%rd4, %rd57, %rd2;
	mov.f32 	%f294, %f287;
	@%p27 bra 	BB3_41;

	shl.b64 	%rd63, %rd4, 2;
	add.s64 	%rd64, %rd1, %rd63;
	ld.global.f32 	%f41, [%rd64];
	setp.ltu.ftz.f32	%p29, %f41, 0f00000000;
	@%p29 bra 	BB3_40;
	bra.uni 	BB3_39;

BB3_40:
	neg.ftz.f32 	%f143, %f41;
	lg2.approx.ftz.f32 	%f144, %f143;
	mul.ftz.f32 	%f145, %f144, 0f3ED55555;
	ex2.approx.ftz.f32 	%f146, %f145;
	neg.ftz.f32 	%f294, %f146;
	bra.uni 	BB3_41;

BB3_39:
	lg2.approx.ftz.f32 	%f141, %f41;
	mul.ftz.f32 	%f142, %f141, 0f3ED55555;
	ex2.approx.ftz.f32 	%f294, %f142;

BB3_41:
	mov.f32 	%f295, %f286;
	@%p25 bra 	BB3_45;

	cvt.s64.s32	%rd65, %r141;
	add.s64 	%rd70, %rd65, %rd2;
	shl.b64 	%rd72, %rd70, 2;
	add.s64 	%rd73, %rd1, %rd72;
	ld.global.f32 	%f45, [%rd73];
	setp.ltu.ftz.f32	%p32, %f45, 0f00000000;
	@%p32 bra 	BB3_44;
	bra.uni 	BB3_43;

BB3_44:
	neg.ftz.f32 	%f149, %f45;
	lg2.approx.ftz.f32 	%f150, %f149;
	mul.ftz.f32 	%f151, %f150, 0f3ED55555;
	ex2.approx.ftz.f32 	%f152, %f151;
	neg.ftz.f32 	%f295, %f152;
	bra.uni 	BB3_45;

BB3_43:
	lg2.approx.ftz.f32 	%f147, %f45;
	mul.ftz.f32 	%f148, %f147, 0f3ED55555;
	ex2.approx.ftz.f32 	%f295, %f148;

BB3_45:
	mov.f32 	%f296, %f287;
	@%p25 bra 	BB3_49;

	shl.b64 	%rd81, %rd4, 2;
	add.s64 	%rd82, %rd1, %rd81;
	ld.global.f32 	%f49, [%rd82+8];
	setp.ltu.ftz.f32	%p35, %f49, 0f00000000;
	@%p35 bra 	BB3_48;
	bra.uni 	BB3_47;

BB3_48:
	neg.ftz.f32 	%f155, %f49;
	lg2.approx.ftz.f32 	%f156, %f155;
	mul.ftz.f32 	%f157, %f156, 0f3ED55555;
	ex2.approx.ftz.f32 	%f158, %f157;
	neg.ftz.f32 	%f296, %f158;
	bra.uni 	BB3_49;

BB3_47:
	lg2.approx.ftz.f32 	%f153, %f49;
	mul.ftz.f32 	%f154, %f153, 0f3ED55555;
	ex2.approx.ftz.f32 	%f296, %f154;

BB3_49:
	setp.lt.s32	%p36, %r2, 2;
	mov.f32 	%f297, %f284;
	@%p36 bra 	BB3_53;

	add.s32 	%r196, %r2, -2;
	mad.lo.s32 	%r204, %r196, %r3, %r1;
	cvt.s64.s32	%rd83, %r204;
	add.s64 	%rd88, %rd83, %rd2;
	shl.b64 	%rd90, %rd88, 2;
	add.s64 	%rd91, %rd1, %rd90;
	ld.global.f32 	%f53, [%rd91];
	setp.ltu.ftz.f32	%p38, %f53, 0f00000000;
	@%p38 bra 	BB3_52;
	bra.uni 	BB3_51;

BB3_52:
	neg.ftz.f32 	%f161, %f53;
	lg2.approx.ftz.f32 	%f162, %f161;
	mul.ftz.f32 	%f163, %f162, 0f3ED55555;
	ex2.approx.ftz.f32 	%f164, %f163;
	neg.ftz.f32 	%f297, %f164;
	bra.uni 	BB3_53;

BB3_51:
	lg2.approx.ftz.f32 	%f159, %f53;
	mul.ftz.f32 	%f160, %f159, 0f3ED55555;
	ex2.approx.ftz.f32 	%f297, %f160;

BB3_53:
	// Fetch the sample two rows ahead of the cell origin: column %r1,
	// row %r2 + 2, result in %f298.
	// Edge handling: when %r2 >= %r17 - 2 the load is skipped and %f298 keeps
	// its default, %f284 (the already-converted sample at column %r1, row %r2).
	// %p39 is reused by the blocks that follow.
	add.s32 	%r212, %r17, -2;
	setp.ge.s32	%p39, %r2, %r212;
	mov.f32 	%f298, %f284;
	@%p39 bra 	BB3_57;

	// Element index = (%r2 + 2) * %r3 + %r1 + %rd2, scaled by 4 bytes.
	add.s32 	%r218, %r2, 2;
	mad.lo.s32 	%r226, %r218, %r3, %r1;
	cvt.s64.s32	%rd92, %r226;
	add.s64 	%rd97, %rd92, %rd2;
	shl.b64 	%rd99, %rd97, 2;
	add.s64 	%rd100, %rd1, %rd99;
	ld.global.f32 	%f57, [%rd100];
	// Sign-preserving power with exponent 0f3ED55555 (~0.41666666);
	// "ltu" also routes NaN inputs to the negated branch.
	setp.ltu.ftz.f32	%p41, %f57, 0f00000000;
	@%p41 bra 	BB3_56;
	bra.uni 	BB3_55;

BB3_56:
	// %f298 = -((-v) ^ 0.41666666)
	neg.ftz.f32 	%f167, %f57;
	lg2.approx.ftz.f32 	%f168, %f167;
	mul.ftz.f32 	%f169, %f168, 0f3ED55555;
	ex2.approx.ftz.f32 	%f170, %f169;
	neg.ftz.f32 	%f298, %f170;
	bra.uni 	BB3_57;

BB3_55:
	// %f298 = v ^ 0.41666666
	lg2.approx.ftz.f32 	%f165, %f57;
	mul.ftz.f32 	%f166, %f165, 0f3ED55555;
	ex2.approx.ftz.f32 	%f298, %f166;

BB3_57:
	mov.f32 	%f299, %f285;
	@%p39 bra 	BB3_61;

	add.s32 	%r240, %r2, 2;
	mad.lo.s32 	%r248, %r240, %r3, %r1;
	add.s32 	%r249, %r248, 1;
	cvt.s64.s32	%rd101, %r249;
	add.s64 	%rd106, %rd101, %rd2;
	shl.b64 	%rd108, %rd106, 2;
	add.s64 	%rd109, %rd1, %rd108;
	ld.global.f32 	%f61, [%rd109];
	setp.ltu.ftz.f32	%p44, %f61, 0f00000000;
	@%p44 bra 	BB3_60;
	bra.uni 	BB3_59;

BB3_60:
	neg.ftz.f32 	%f173, %f61;
	lg2.approx.ftz.f32 	%f174, %f173;
	mul.ftz.f32 	%f175, %f174, 0f3ED55555;
	ex2.approx.ftz.f32 	%f176, %f175;
	neg.ftz.f32 	%f299, %f176;
	bra.uni 	BB3_61;

BB3_59:
	lg2.approx.ftz.f32 	%f171, %f61;
	mul.ftz.f32 	%f172, %f171, 0f3ED55555;
	ex2.approx.ftz.f32 	%f299, %f172;

BB3_61:
	or.pred  	%p47, %p39, %p13;
	mov.f32 	%f300, %f284;
	@%p47 bra 	BB3_65;

	add.s32 	%r269, %r2, 2;
	mad.lo.s32 	%r277, %r269, %r3, %r1;
	add.s32 	%r278, %r277, 1;
	cvt.s64.s32	%rd111, %r278;
	add.s64 	%rd116, %rd111, %rd2;
	shl.b64 	%rd117, %rd116, 2;
	add.s64 	%rd118, %rd1, %rd117;
	ld.global.f32 	%f65, [%rd118+4];
	setp.ltu.ftz.f32	%p49, %f65, 0f00000000;
	@%p49 bra 	BB3_64;
	bra.uni 	BB3_63;

BB3_64:
	neg.ftz.f32 	%f179, %f65;
	lg2.approx.ftz.f32 	%f180, %f179;
	mul.ftz.f32 	%f181, %f180, 0f3ED55555;
	ex2.approx.ftz.f32 	%f182, %f181;
	neg.ftz.f32 	%f300, %f182;
	bra.uni 	BB3_65;

BB3_63:
	lg2.approx.ftz.f32 	%f177, %f65;
	mul.ftz.f32 	%f178, %f177, 0f3ED55555;
	ex2.approx.ftz.f32 	%f300, %f178;

BB3_65:
	add.s32 	%r286, %r17, -3;
	setp.ge.s32	%p50, %r2, %r286;
	mov.f32 	%f301, %f287;
	@%p50 bra 	BB3_69;

	add.s32 	%r292, %r2, 3;
	mad.lo.s32 	%r300, %r292, %r3, %r1;
	add.s32 	%r301, %r300, 1;
	cvt.s64.s32	%rd119, %r301;
	add.s64 	%rd124, %rd119, %rd2;
	shl.b64 	%rd126, %rd124, 2;
	add.s64 	%rd127, %rd1, %rd126;
	ld.global.f32 	%f69, [%rd127];
	setp.ltu.ftz.f32	%p52, %f69, 0f00000000;
	@%p52 bra 	BB3_68;
	bra.uni 	BB3_67;

BB3_68:
	neg.ftz.f32 	%f185, %f69;
	lg2.approx.ftz.f32 	%f186, %f185;
	mul.ftz.f32 	%f187, %f186, 0f3ED55555;
	ex2.approx.ftz.f32 	%f188, %f187;
	neg.ftz.f32 	%f301, %f188;
	bra.uni 	BB3_69;

BB3_67:
	lg2.approx.ftz.f32 	%f183, %f69;
	mul.ftz.f32 	%f184, %f183, 0f3ED55555;
	ex2.approx.ftz.f32 	%f301, %f184;

BB3_69:
	// Interpolation for the 2x2 cell whose top-left sample is (x, y) = (%r1, %r2).
	// Converted samples, by (column, row) as loaded earlier in this kernel:
	//   %f284 (x,y)      %f285 (x+1,y)    %f286 (x,y+1)    %f287 (x+1,y+1)
	//   %f288 (x-1,y+1)  %f289 (x+2,y+1)  %f290 (x+3,y+1)
	//   %f291 (x-2,y)    %f292 (x-1,y)    %f293 (x+2,y)
	//   %f294 (x-1,y-1)  %f295 (x,y-1)    %f296 (x+1,y-1)
	//   %f297 (x,y-2)    %f298 (x,y+2)    %f299 (x+1,y+2)
	//   %f300 (x+2,y+2)  %f301 (x+1,y+3)
	// Constants: 0f3E800000 = 0.25, 0f3F000000 = 0.5, 0f3C4CCCCD = 0.0125.
	// NOTE(review): the scheme resembles gradient-corrected (Hamilton-Adams
	// style) green interpolation -- confirm against the kernel's source.

	// ---- Missing channel at (x, y) -> %f73 ----
	// %f191 = 2*c - up2 - down2 (vertical second difference), c = %f284.
	sub.ftz.f32 	%f189, %f284, %f298;
	sub.ftz.f32 	%f190, %f284, %f297;
	add.ftz.f32 	%f191, %f190, %f189;
	// %f194 = 2*c - left2 - right2 (horizontal second difference).
	sub.ftz.f32 	%f192, %f284, %f291;
	sub.ftz.f32 	%f193, %f284, %f293;
	add.ftz.f32 	%f194, %f192, %f193;
	// Sums of the immediate vertical (%f195) and horizontal (%f196) neighbours.
	add.ftz.f32 	%f195, %f286, %f295;
	add.ftz.f32 	%f196, %f285, %f292;
	// %f198 = vertical estimate   = 0.5 * %f195 + 0.25 * %f191
	mul.ftz.f32 	%f197, %f191, 0f3E800000;
	fma.rn.ftz.f32 	%f198, %f195, 0f3F000000, %f197;
	// %f200 = horizontal estimate = 0.5 * %f196 + 0.25 * %f194
	mul.ftz.f32 	%f199, %f194, 0f3E800000;
	fma.rn.ftz.f32 	%f200, %f196, 0f3F000000, %f199;
	// %f202 = mean of the two estimates.
	add.ftz.f32 	%f201, %f200, %f198;
	mul.ftz.f32 	%f202, %f201, 0f3F000000;
	// %f210 = 0.0125 * (sum of the 4 adjacent and 4 distance-2 samples):
	// threshold below which the two directions are treated as equally good.
	add.ftz.f32 	%f203, %f286, %f292;
	add.ftz.f32 	%f204, %f203, %f295;
	add.ftz.f32 	%f205, %f285, %f204;
	add.ftz.f32 	%f206, %f205, %f298;
	add.ftz.f32 	%f207, %f291, %f206;
	add.ftz.f32 	%f208, %f297, %f207;
	add.ftz.f32 	%f209, %f293, %f208;
	mul.ftz.f32 	%f210, %f209, 0f3C4CCCCD;
	// %f214 = vertical activity   = |down - up|    + |%f191|
	sub.ftz.f32 	%f211, %f286, %f295;
	abs.ftz.f32 	%f212, %f211;
	abs.ftz.f32 	%f213, %f191;
	add.ftz.f32 	%f214, %f212, %f213;
	// %f218 = horizontal activity = |left - right| + |%f194|
	sub.ftz.f32 	%f215, %f292, %f285;
	abs.ftz.f32 	%f216, %f215;
	abs.ftz.f32 	%f217, %f194;
	add.ftz.f32 	%f218, %f216, %f217;
	// Pick the estimate along the direction with less activity; fall back to
	// the mean when the activity difference is below the threshold.
	sub.ftz.f32 	%f219, %f214, %f218;
	setp.lt.ftz.f32	%p53, %f219, 0f00000000;
	selp.f32	%f220, %f198, %f200, %p53;
	abs.ftz.f32 	%f221, %f219;
	setp.lt.ftz.f32	%p54, %f221, %f210;
	selp.f32	%f73, %f202, %f220, %p54;

	// ---- Missing channel at (x+1, y+1) -> %f74 (same scheme, c = %f287) ----
	// %f224 = vertical second difference, %f227 = horizontal second difference.
	sub.ftz.f32 	%f222, %f287, %f301;
	sub.ftz.f32 	%f223, %f287, %f296;
	add.ftz.f32 	%f224, %f223, %f222;
	sub.ftz.f32 	%f225, %f287, %f288;
	sub.ftz.f32 	%f226, %f287, %f290;
	add.ftz.f32 	%f227, %f225, %f226;
	// Vertical (%f228) and horizontal (%f229) neighbour sums.
	add.ftz.f32 	%f228, %f285, %f299;
	add.ftz.f32 	%f229, %f286, %f289;
	// %f231 = vertical estimate, %f233 = horizontal estimate, %f235 = mean.
	mul.ftz.f32 	%f230, %f224, 0f3E800000;
	fma.rn.ftz.f32 	%f231, %f228, 0f3F000000, %f230;
	mul.ftz.f32 	%f232, %f227, 0f3E800000;
	fma.rn.ftz.f32 	%f233, %f229, 0f3F000000, %f232;
	add.ftz.f32 	%f234, %f233, %f231;
	mul.ftz.f32 	%f235, %f234, 0f3F000000;
	// %f243 = 0.0125 * (sum of the 8 surrounding samples used above).
	add.ftz.f32 	%f236, %f286, %f299;
	add.ftz.f32 	%f237, %f285, %f236;
	add.ftz.f32 	%f238, %f289, %f237;
	add.ftz.f32 	%f239, %f238, %f301;
	add.ftz.f32 	%f240, %f288, %f239;
	add.ftz.f32 	%f241, %f296, %f240;
	add.ftz.f32 	%f242, %f290, %f241;
	mul.ftz.f32 	%f243, %f242, 0f3C4CCCCD;
	// %f247 = vertical activity, %f251 = horizontal activity.
	sub.ftz.f32 	%f244, %f299, %f285;
	abs.ftz.f32 	%f245, %f244;
	abs.ftz.f32 	%f246, %f224;
	add.ftz.f32 	%f247, %f245, %f246;
	sub.ftz.f32 	%f248, %f286, %f289;
	abs.ftz.f32 	%f249, %f248;
	abs.ftz.f32 	%f250, %f227;
	add.ftz.f32 	%f251, %f249, %f250;
	// Direction choice with the same threshold fallback as for %f73.
	sub.ftz.f32 	%f252, %f247, %f251;
	setp.lt.ftz.f32	%p55, %f252, 0f00000000;
	selp.f32	%f253, %f231, %f233, %p55;
	abs.ftz.f32 	%f254, %f252;
	setp.lt.ftz.f32	%p56, %f254, %f243;
	selp.f32	%f74, %f235, %f253, %p56;

	// ---- Plain neighbour averages for the remaining components ----
	// %f75 = mean of the four diagonal neighbours of (x, y).
	add.ftz.f32 	%f255, %f294, %f296;
	add.ftz.f32 	%f256, %f288, %f255;
	add.ftz.f32 	%f257, %f287, %f256;
	mul.ftz.f32 	%f75, %f257, 0f3E800000;
	// %f76 = mean of the samples above and below (x+1, y).
	add.ftz.f32 	%f258, %f287, %f296;
	mul.ftz.f32 	%f76, %f258, 0f3F000000;
	// %f77 = mean of the samples left and right of (x+1, y).
	add.ftz.f32 	%f259, %f284, %f293;
	mul.ftz.f32 	%f77, %f259, 0f3F000000;
	// %f78 = mean of the samples left and right of (x, y+1).
	add.ftz.f32 	%f260, %f287, %f288;
	mul.ftz.f32 	%f78, %f260, 0f3F000000;
	// %f79 = mean of the samples above and below (x, y+1).
	add.ftz.f32 	%f261, %f284, %f298;
	mul.ftz.f32 	%f79, %f261, 0f3F000000;
	// %f80 = mean of the four diagonal neighbours of (x+1, y+1).
	add.ftz.f32 	%f262, %f259, %f298;
	add.ftz.f32 	%f263, %f262, %f300;
	mul.ftz.f32 	%f80, %f263, 0f3E800000;
	// Output index of pixel (x, y): %r6 = 2 * %r25 * %r14 + %r1, i.e.
	// row %r2 times the destination pitch plus column %r1.
	mul.lo.s32 	%r308, %r25, %r14;
	shl.b32 	%r5, %r308, 1;
	add.s32 	%r6, %r5, %r1;
	// %r15 == 0 selects the half-precision store path; %p57 is reused by the
	// later pixel stores.
	setp.eq.s32	%p57, %r15, 0;
	@%p57 bra 	BB3_71;

	cvta.to.global.u64 	%rd128, %rd6;
	mul.wide.s32 	%rd129, %r6, 16;
	add.s64 	%rd130, %rd128, %rd129;
	mov.f32 	%f264, 0f3F800000;
	st.global.v4.f32 	[%rd130], {%f75, %f73, %f284, %f264};
	bra.uni 	BB3_72;

BB3_71:
	cvta.to.global.u64 	%rd131, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs1, %f75;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs2, %f73;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs3, %f284;}

	// inline asm
	mov.f32 	%f268, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs4, %f268;}

	// inline asm
	mul.wide.s32 	%rd132, %r6, 8;
	add.s64 	%rd133, %rd131, %rd132;
	st.global.u16 	[%rd133], %rs1;
	st.global.u16 	[%rd133+2], %rs2;
	st.global.u16 	[%rd133+4], %rs3;
	st.global.u16 	[%rd133+6], %rs4;

BB3_72:
	add.s32 	%r319, %r1, %r5;
	add.s32 	%r7, %r319, 1;
	@%p57 bra 	BB3_74;

	cvta.to.global.u64 	%rd134, %rd6;
	mul.wide.s32 	%rd135, %r7, 16;
	add.s64 	%rd136, %rd134, %rd135;
	mov.f32 	%f269, 0f3F800000;
	st.global.v4.f32 	[%rd136], {%f76, %f285, %f77, %f269};
	bra.uni 	BB3_75;

BB3_74:
	cvta.to.global.u64 	%rd137, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs5, %f76;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs6, %f285;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs7, %f77;}

	// inline asm
	mov.f32 	%f273, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs8, %f273;}

	// inline asm
	mul.wide.s32 	%rd138, %r7, 8;
	add.s64 	%rd139, %rd137, %rd138;
	st.global.u16 	[%rd139], %rs5;
	st.global.u16 	[%rd139+2], %rs6;
	st.global.u16 	[%rd139+4], %rs7;
	st.global.u16 	[%rd139+6], %rs8;

BB3_75:
	mul.lo.s32 	%r8, %r31, %r14;
	add.s32 	%r9, %r8, %r1;
	@%p57 bra 	BB3_77;

	cvta.to.global.u64 	%rd140, %rd6;
	mul.wide.s32 	%rd141, %r9, 16;
	add.s64 	%rd142, %rd140, %rd141;
	mov.f32 	%f274, 0f3F800000;
	st.global.v4.f32 	[%rd142], {%f78, %f286, %f79, %f274};
	bra.uni 	BB3_78;

BB3_77:
	cvta.to.global.u64 	%rd143, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs9, %f78;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs10, %f286;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs11, %f79;}

	// inline asm
	mov.f32 	%f278, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs12, %f278;}

	// inline asm
	mul.wide.s32 	%rd144, %r9, 8;
	add.s64 	%rd145, %rd143, %rd144;
	st.global.u16 	[%rd145], %rs9;
	st.global.u16 	[%rd145+2], %rs10;
	st.global.u16 	[%rd145+4], %rs11;
	st.global.u16 	[%rd145+6], %rs12;

BB3_78:
	add.s32 	%r336, %r1, %r8;
	add.s32 	%r10, %r336, 1;
	@%p57 bra 	BB3_80;

	cvta.to.global.u64 	%rd146, %rd6;
	mul.wide.s32 	%rd147, %r10, 16;
	add.s64 	%rd148, %rd146, %rd147;
	mov.f32 	%f279, 0f3F800000;
	st.global.v4.f32 	[%rd148], {%f287, %f74, %f80, %f279};
	bra.uni 	BB3_81;

BB3_80:
	cvta.to.global.u64 	%rd149, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs13, %f287;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs14, %f74;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs15, %f80;}

	// inline asm
	mov.f32 	%f283, 0f3F800000;
	// inline asm
	{  cvt.rn.f16.f32 %rs16, %f283;}

	// inline asm
	mul.wide.s32 	%rd150, %r10, 8;
	add.s64 	%rd151, %rd149, %rd150;
	st.global.u16 	[%rd151], %rs13;
	st.global.u16 	[%rd151+2], %rs14;
	st.global.u16 	[%rd151+4], %rs15;
	st.global.u16 	[%rd151+6], %rs16;

BB3_81:
	ret;
}

	// .globl	PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel
.visible .entry PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel(
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_0,
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_1,
	.param .u64 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_2,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_3,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_4,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_5,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_6,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_7,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_8,
	.param .align 16 .b8 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_9[16],
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_10,
	.param .u32 PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_11
)
{
	.reg .pred 	%p<62>;
	.reg .b16 	%rs<39>;
	.reg .f32 	%f<566>;
	.reg .b32 	%r<206>;
	.reg .b64 	%rd<98>;
	// demoted variable
	.shared .align 4 .b8 _ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix[36];

	ld.param.u64 	%rd5, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_0];
	ld.param.u64 	%rd6, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_1];
	ld.param.u64 	%rd7, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_2];
	ld.param.u32 	%r17, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_3];
	ld.param.u32 	%r18, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_4];
	ld.param.u32 	%r19, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_5];
	ld.param.u32 	%r20, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_6];
	ld.param.u32 	%r21, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_7];
	ld.param.u32 	%r22, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_8];
	ld.param.f32 	%f190, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_9+8];
	ld.param.f32 	%f189, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_9+4];
	ld.param.f32 	%f188, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_9];
	ld.param.u32 	%r23, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_10];
	ld.param.u32 	%r24, [PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel_param_11];
	cvta.to.global.u64 	%rd1, %rd5;
	mov.u32 	%r1, %tid.x;
	mov.u32 	%r25, %ntid.y;
	mov.u32 	%r26, %ctaid.y;
	mov.u32 	%r27, %tid.y;
	mad.lo.s32 	%r2, %r25, %r26, %r27;
	setp.ne.s32	%p1, %r27, 0;
	setp.gt.u32	%p2, %r1, 2;
	or.pred  	%p3, %p1, %p2;
	@%p3 bra 	BB4_2;

	cvta.to.global.u64 	%rd8, %rd7;
	cvt.s64.s32	%rd9, %r23;
	setp.ne.s32	%p4, %r22, 0;
	mul.lo.s32 	%r28, %r1, 3;
	cvt.s64.s32	%rd10, %r28;
	selp.b64	%rd11, 2, 0, %p4;
	add.s64 	%rd12, %rd9, %rd11;
	add.s64 	%rd13, %rd12, %rd10;
	shl.b64 	%rd14, %rd13, 2;
	add.s64 	%rd15, %rd8, %rd14;
	ld.global.f32 	%f192, [%rd15];
	shl.b32 	%r29, %r28, 2;
	mov.u32 	%r30, _ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix;
	add.s32 	%r31, %r30, %r29;
	st.volatile.shared.f32 	[%r31], %f192;
	add.s32 	%r32, %r23, %r28;
	mul.wide.s32 	%rd16, %r32, 4;
	add.s64 	%rd17, %rd8, %rd16;
	ld.global.f32 	%f193, [%rd17+4];
	st.volatile.shared.f32 	[%r31+4], %f193;
	selp.b64	%rd18, 0, 2, %p4;
	add.s64 	%rd19, %rd9, %rd18;
	add.s64 	%rd20, %rd19, %rd10;
	shl.b64 	%rd21, %rd20, 2;
	add.s64 	%rd22, %rd8, %rd21;
	ld.global.f32 	%f194, [%rd22];
	st.volatile.shared.f32 	[%r31+8], %f194;

BB4_2:
	bar.sync 	0;
	mov.u32 	%r33, %ctaid.x;
	mov.u32 	%r34, %ntid.x;
	mad.lo.s32 	%r35, %r34, %r33, %r1;
	shl.b32 	%r3, %r35, 1;
	setp.ge.s32	%p5, %r3, %r20;
	shl.b32 	%r4, %r2, 1;
	setp.ge.s32	%p6, %r4, %r21;
	or.pred  	%p7, %p5, %p6;
	@%p7 bra 	BB4_131;

	mul.lo.s32 	%r5, %r4, %r17;
	add.s32 	%r6, %r5, %r3;
	cvt.s64.s32	%rd2, %r6;
	setp.eq.s32	%p8, %r19, 0;
	@%p8 bra 	BB4_5;

	mul.wide.s32 	%rd23, %r6, 16;
	add.s64 	%rd24, %rd1, %rd23;
	ld.global.v4.f32 	{%f512, %f513, %f514, %f515}, [%rd24];
	bra.uni 	BB4_6;

BB4_5:
	mul.wide.s32 	%rd26, %r6, 8;
	add.s64 	%rd27, %rd1, %rd26;
	ld.global.u16 	%rs1, [%rd27];
	ld.global.u16 	%rs2, [%rd27+2];
	ld.global.u16 	%rs3, [%rd27+4];
	ld.global.u16 	%rs4, [%rd27+6];
	// inline asm
	{  cvt.f32.f16 %f512, %rs1;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f513, %rs2;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f514, %rs3;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f515, %rs4;}

	// inline asm

BB4_6:
	mul.wide.s32 	%rd28, %r6, 16;
	add.s64 	%rd3, %rd1, %rd28;
	@%p8 bra 	BB4_8;

	ld.global.v4.f32 	{%f516, %f517, %f518, %f519}, [%rd3+16];
	bra.uni 	BB4_9;

BB4_8:
	add.s32 	%r37, %r3, %r5;
	add.s32 	%r38, %r37, 1;
	mul.wide.s32 	%rd30, %r38, 8;
	add.s64 	%rd31, %rd1, %rd30;
	ld.global.u16 	%rs5, [%rd31];
	ld.global.u16 	%rs6, [%rd31+2];
	ld.global.u16 	%rs7, [%rd31+4];
	ld.global.u16 	%rs8, [%rd31+6];
	// inline asm
	{  cvt.f32.f16 %f516, %rs5;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f517, %rs6;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f518, %rs7;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f519, %rs8;}

	// inline asm

BB4_9:
	add.s32 	%r39, %r4, 1;
	mad.lo.s32 	%r7, %r39, %r17, %r3;
	@%p8 bra 	BB4_11;

	mul.wide.s32 	%rd33, %r7, 16;
	add.s64 	%rd34, %rd1, %rd33;
	ld.global.v4.f32 	{%f520, %f521, %f522, %f523}, [%rd34];
	bra.uni 	BB4_12;

BB4_11:
	mul.wide.s32 	%rd36, %r7, 8;
	add.s64 	%rd37, %rd1, %rd36;
	ld.global.u16 	%rs9, [%rd37];
	ld.global.u16 	%rs10, [%rd37+2];
	ld.global.u16 	%rs11, [%rd37+4];
	ld.global.u16 	%rs12, [%rd37+6];
	// inline asm
	{  cvt.f32.f16 %f520, %rs9;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f521, %rs10;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f522, %rs11;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f523, %rs12;}

	// inline asm

BB4_12:
	@%p8 bra 	BB4_14;

	add.s32 	%r48, %r7, -1;
	mul.wide.s32 	%rd39, %r48, 16;
	add.s64 	%rd40, %rd1, %rd39;
	ld.global.v4.f32 	{%f524, %f525, %f526, %f527}, [%rd40+32];
	bra.uni 	BB4_15;

BB4_14:
	add.s32 	%r57, %r7, 1;
	mul.wide.s32 	%rd42, %r57, 8;
	add.s64 	%rd43, %rd1, %rd42;
	ld.global.u16 	%rs13, [%rd43];
	ld.global.u16 	%rs14, [%rd43+2];
	ld.global.u16 	%rs15, [%rd43+4];
	ld.global.u16 	%rs16, [%rd43+6];
	// inline asm
	{  cvt.f32.f16 %f524, %rs13;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f525, %rs14;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f526, %rs15;}

	// inline asm
	// inline asm
	{  cvt.f32.f16 %f527, %rs16;}

	// inline asm

BB4_15:
	add.s32 	%r63, %r20, -2;
	setp.ge.s32	%p12, %r3, %r63;
	mov.f32 	%f528, %f521;
	@%p12 bra 	BB4_19;

	@%p8 bra 	BB4_18;

	ld.global.f32 	%f528, [%rd3+36];
	bra.uni 	BB4_19;

BB4_18:
	cvt.u32.u64	%r64, %rd2;
	add.s32 	%r65, %r64, 2;
	mul.wide.s32 	%rd45, %r65, 8;
	add.s64 	%rd46, %rd1, %rd45;
	ld.global.u16 	%rs17, [%rd46+2];
	// inline asm
	{  cvt.f32.f16 %f528, %rs17;}

	// inline asm

BB4_19:
	add.s32 	%r71, %r21, -2;
	setp.ge.s32	%p14, %r4, %r71;
	mov.f32 	%f529, %f517;
	@%p14 bra 	BB4_23;

	add.s32 	%r77, %r4, 2;
	mad.lo.s32 	%r8, %r77, %r17, %r3;
	@%p8 bra 	BB4_22;

	mul.wide.s32 	%rd48, %r8, 16;
	add.s64 	%rd49, %rd1, %rd48;
	ld.global.f32 	%f529, [%rd49+4];
	bra.uni 	BB4_23;

BB4_22:
	mul.wide.s32 	%rd51, %r8, 8;
	add.s64 	%rd52, %rd1, %rd51;
	ld.global.u16 	%rs18, [%rd52+2];
	// inline asm
	{  cvt.f32.f16 %f529, %rs18;}

	// inline asm

BB4_23:
	or.pred  	%p18, %p12, %p14;
	mov.f32 	%f530, %f525;
	@%p18 bra 	BB4_27;

	add.s32 	%r105, %r4, 2;
	mad.lo.s32 	%r106, %r105, %r17, %r3;
	add.s32 	%r9, %r106, 2;
	@%p8 bra 	BB4_26;

	mul.wide.s32 	%rd54, %r9, 16;
	add.s64 	%rd55, %rd1, %rd54;
	ld.global.f32 	%f530, [%rd55+4];
	bra.uni 	BB4_27;

BB4_26:
	mul.wide.s32 	%rd57, %r9, 8;
	add.s64 	%rd58, %rd1, %rd57;
	ld.global.u16 	%rs19, [%rd58+2];
	// inline asm
	{  cvt.f32.f16 %f530, %rs19;}

	// inline asm

BB4_27:
	setp.lt.s32	%p20, %r2, 1;
	setp.lt.s32	%p21, %r35, 1;
	add.ftz.f32 	%f230, %f513, %f528;
	mul.ftz.f32 	%f231, %f230, 0f3F000000;
	sub.ftz.f32 	%f232, %f517, %f231;
	add.ftz.f32 	%f58, %f518, %f232;
	add.ftz.f32 	%f233, %f513, %f529;
	mul.ftz.f32 	%f234, %f233, 0f3F000000;
	sub.ftz.f32 	%f235, %f521, %f234;
	add.ftz.f32 	%f59, %f522, %f235;
	add.ftz.f32 	%f236, %f230, %f529;
	add.ftz.f32 	%f237, %f236, %f530;
	fma.rn.ftz.f32 	%f238, %f237, 0fBE800000, %f525;
	add.ftz.f32 	%f60, %f526, %f238;
	or.pred  	%p22, %p21, %p20;
	add.s32 	%r116, %r4, -1;
	mad.lo.s32 	%r118, %r116, %r17, %r3;
	add.s32 	%r10, %r118, -1;
	mul.wide.s32 	%rd60, %r10, 16;
	add.s64 	%rd61, %rd1, %rd60;
	add.s64 	%rd4, %rd61, 4;
	mov.f32 	%f531, %f525;
	@%p22 bra 	BB4_31;

	@%p8 bra 	BB4_30;

	ld.global.f32 	%f531, [%rd4];
	bra.uni 	BB4_31;

BB4_30:
	mul.wide.s32 	%rd63, %r10, 8;
	add.s64 	%rd64, %rd1, %rd63;
	ld.global.u16 	%rs20, [%rd64+2];
	// inline asm
	{  cvt.f32.f16 %f531, %rs20;}

	// inline asm

BB4_31:
	mov.f32 	%f532, %f517;
	@%p20 bra 	BB4_35;

	@%p8 bra 	BB4_34;

	ld.global.f32 	%f532, [%rd4+32];
	bra.uni 	BB4_35;

BB4_34:
	add.s32 	%r135, %r118, 1;
	mul.wide.s32 	%rd66, %r135, 8;
	add.s64 	%rd67, %rd1, %rd66;
	ld.global.u16 	%rs21, [%rd67+2];
	// inline asm
	{  cvt.f32.f16 %f532, %rs21;}

	// inline asm

BB4_35:
	mov.f32 	%f533, %f521;
	@%p21 bra 	BB4_39;

	@%p8 bra 	BB4_38;

	add.s32 	%r152, %r7, -1;
	mul.wide.s32 	%rd69, %r152, 16;
	add.s64 	%rd70, %rd1, %rd69;
	ld.global.f32 	%f533, [%rd70+4];
	bra.uni 	BB4_39;

BB4_38:
	add.s32 	%r165, %r7, -1;
	mul.wide.s32 	%rd72, %r165, 8;
	add.s64 	%rd73, %rd1, %rd72;
	ld.global.u16 	%rs22, [%rd73+2];
	// inline asm
	{  cvt.f32.f16 %f533, %rs22;}

	// inline asm

BB4_39:
	add.ftz.f32 	%f242, %f531, %f532;
	add.ftz.f32 	%f243, %f242, %f533;
	add.ftz.f32 	%f244, %f525, %f243;
	fma.rn.ftz.f32 	%f245, %f244, 0fBE800000, %f513;
	add.ftz.f32 	%f70, %f512, %f245;
	add.ftz.f32 	%f246, %f525, %f532;
	mul.ftz.f32 	%f247, %f246, 0f3F000000;
	sub.ftz.f32 	%f248, %f517, %f247;
	add.ftz.f32 	%f71, %f516, %f248;
	add.ftz.f32 	%f249, %f525, %f533;
	mul.ftz.f32 	%f250, %f249, 0f3F000000;
	sub.ftz.f32 	%f251, %f521, %f250;
	add.ftz.f32 	%f72, %f520, %f251;
	setp.ltu.ftz.f32	%p28, %f514, 0f00000000;
	@%p28 bra 	BB4_41;
	bra.uni 	BB4_40;

BB4_41:
	neg.ftz.f32 	%f254, %f514;
	lg2.approx.ftz.f32 	%f255, %f254;
	mul.ftz.f32 	%f256, %f255, 0f4019999A;
	ex2.approx.ftz.f32 	%f257, %f256;
	neg.ftz.f32 	%f534, %f257;
	bra.uni 	BB4_42;

BB4_40:
	lg2.approx.ftz.f32 	%f252, %f514;
	mul.ftz.f32 	%f253, %f252, 0f4019999A;
	ex2.approx.ftz.f32 	%f534, %f253;

BB4_42:
	setp.ltu.ftz.f32	%p29, %f513, 0f00000000;
	@%p29 bra 	BB4_44;
	bra.uni 	BB4_43;

BB4_44:
	neg.ftz.f32 	%f260, %f513;
	lg2.approx.ftz.f32 	%f261, %f260;
	mul.ftz.f32 	%f262, %f261, 0f4019999A;
	ex2.approx.ftz.f32 	%f263, %f262;
	neg.ftz.f32 	%f535, %f263;
	bra.uni 	BB4_45;

BB4_43:
	lg2.approx.ftz.f32 	%f258, %f513;
	mul.ftz.f32 	%f259, %f258, 0f4019999A;
	ex2.approx.ftz.f32 	%f535, %f259;

BB4_45:
	setp.ltu.ftz.f32	%p30, %f70, 0f00000000;
	@%p30 bra 	BB4_47;
	bra.uni 	BB4_46;

BB4_47:
	neg.ftz.f32 	%f266, %f70;
	lg2.approx.ftz.f32 	%f267, %f266;
	mul.ftz.f32 	%f268, %f267, 0f4019999A;
	ex2.approx.ftz.f32 	%f269, %f268;
	neg.ftz.f32 	%f536, %f269;
	bra.uni 	BB4_48;

BB4_46:
	lg2.approx.ftz.f32 	%f264, %f70;
	mul.ftz.f32 	%f265, %f264, 0f4019999A;
	ex2.approx.ftz.f32 	%f536, %f265;

BB4_48:
	min.ftz.f32 	%f83, %f534, %f188;
	min.ftz.f32 	%f85, %f535, %f189;
	min.ftz.f32 	%f87, %f536, %f190;
	ld.volatile.shared.f32 	%f270, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+24];
	ld.volatile.shared.f32 	%f271, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+28];
	mul.ftz.f32 	%f272, %f85, %f271;
	fma.rn.ftz.f32 	%f273, %f83, %f270, %f272;
	ld.volatile.shared.f32 	%f274, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+32];
	fma.rn.ftz.f32 	%f539, %f87, %f274, %f273;
	setp.eq.s32	%p31, %r24, 0;
	@%p31 bra 	BB4_58;

	setp.ltu.ftz.f32	%p32, %f539, 0f00000000;
	@%p32 bra 	BB4_51;
	bra.uni 	BB4_50;

BB4_51:
	neg.ftz.f32 	%f277, %f539;
	lg2.approx.ftz.f32 	%f278, %f277;
	mul.ftz.f32 	%f279, %f278, 0f3ED55555;
	ex2.approx.ftz.f32 	%f280, %f279;
	neg.ftz.f32 	%f539, %f280;
	bra.uni 	BB4_52;

BB4_58:
	ld.volatile.shared.f32 	%f303, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f304, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f305, %f85, %f304;
	fma.rn.ftz.f32 	%f306, %f83, %f303, %f305;
	ld.volatile.shared.f32 	%f307, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f540, %f87, %f307, %f306;
	ld.volatile.shared.f32 	%f308, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f309, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f310, %f85, %f309;
	fma.rn.ftz.f32 	%f311, %f83, %f308, %f310;
	ld.volatile.shared.f32 	%f312, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f541, %f87, %f312, %f311;
	bra.uni 	BB4_59;

BB4_50:
	lg2.approx.ftz.f32 	%f275, %f539;
	mul.ftz.f32 	%f276, %f275, 0f3ED55555;
	ex2.approx.ftz.f32 	%f539, %f276;

BB4_52:
	ld.volatile.shared.f32 	%f281, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f282, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f283, %f85, %f282;
	fma.rn.ftz.f32 	%f284, %f83, %f281, %f283;
	ld.volatile.shared.f32 	%f285, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f92, %f87, %f285, %f284;
	setp.ltu.ftz.f32	%p33, %f92, 0f00000000;
	@%p33 bra 	BB4_54;
	bra.uni 	BB4_53;

BB4_54:
	neg.ftz.f32 	%f288, %f92;
	lg2.approx.ftz.f32 	%f289, %f288;
	mul.ftz.f32 	%f290, %f289, 0f3ED55555;
	ex2.approx.ftz.f32 	%f291, %f290;
	neg.ftz.f32 	%f540, %f291;
	bra.uni 	BB4_55;

BB4_53:
	lg2.approx.ftz.f32 	%f286, %f92;
	mul.ftz.f32 	%f287, %f286, 0f3ED55555;
	ex2.approx.ftz.f32 	%f540, %f287;

BB4_55:
	ld.volatile.shared.f32 	%f292, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f293, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f294, %f85, %f293;
	fma.rn.ftz.f32 	%f295, %f83, %f292, %f294;
	ld.volatile.shared.f32 	%f296, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f96, %f87, %f296, %f295;
	setp.ltu.ftz.f32	%p34, %f96, 0f00000000;
	@%p34 bra 	BB4_57;
	bra.uni 	BB4_56;

BB4_57:
	neg.ftz.f32 	%f299, %f96;
	lg2.approx.ftz.f32 	%f300, %f299;
	mul.ftz.f32 	%f301, %f300, 0f3ED55555;
	ex2.approx.ftz.f32 	%f302, %f301;
	neg.ftz.f32 	%f541, %f302;
	bra.uni 	BB4_59;

BB4_56:
	lg2.approx.ftz.f32 	%f297, %f96;
	mul.ftz.f32 	%f298, %f297, 0f3ED55555;
	ex2.approx.ftz.f32 	%f541, %f298;

BB4_59:
	setp.ltu.ftz.f32	%p35, %f58, 0f00000000;
	@%p35 bra 	BB4_61;
	bra.uni 	BB4_60;

BB4_61:
	neg.ftz.f32 	%f315, %f58;
	lg2.approx.ftz.f32 	%f316, %f315;
	mul.ftz.f32 	%f317, %f316, 0f4019999A;
	ex2.approx.ftz.f32 	%f318, %f317;
	neg.ftz.f32 	%f542, %f318;
	bra.uni 	BB4_62;

BB4_60:
	lg2.approx.ftz.f32 	%f313, %f58;
	mul.ftz.f32 	%f314, %f313, 0f4019999A;
	ex2.approx.ftz.f32 	%f542, %f314;

BB4_62:
	setp.ltu.ftz.f32	%p36, %f517, 0f00000000;
	@%p36 bra 	BB4_64;
	bra.uni 	BB4_63;

BB4_64:
	neg.ftz.f32 	%f321, %f517;
	lg2.approx.ftz.f32 	%f322, %f321;
	mul.ftz.f32 	%f323, %f322, 0f4019999A;
	ex2.approx.ftz.f32 	%f324, %f323;
	neg.ftz.f32 	%f543, %f324;
	bra.uni 	BB4_65;

BB4_63:
	lg2.approx.ftz.f32 	%f319, %f517;
	mul.ftz.f32 	%f320, %f319, 0f4019999A;
	ex2.approx.ftz.f32 	%f543, %f320;

BB4_65:
	setp.ltu.ftz.f32	%p37, %f71, 0f00000000;
	@%p37 bra 	BB4_67;
	bra.uni 	BB4_66;

BB4_67:
	neg.ftz.f32 	%f327, %f71;
	lg2.approx.ftz.f32 	%f328, %f327;
	mul.ftz.f32 	%f329, %f328, 0f4019999A;
	ex2.approx.ftz.f32 	%f330, %f329;
	neg.ftz.f32 	%f544, %f330;
	bra.uni 	BB4_68;

BB4_66:
	lg2.approx.ftz.f32 	%f325, %f71;
	mul.ftz.f32 	%f326, %f325, 0f4019999A;
	ex2.approx.ftz.f32 	%f544, %f326;

BB4_68:
	ld.volatile.shared.f32 	%f331, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+24];
	min.ftz.f32 	%f113, %f542, %f188;
	ld.volatile.shared.f32 	%f332, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+28];
	min.ftz.f32 	%f114, %f543, %f189;
	mul.ftz.f32 	%f333, %f114, %f332;
	fma.rn.ftz.f32 	%f334, %f113, %f331, %f333;
	ld.volatile.shared.f32 	%f335, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+32];
	min.ftz.f32 	%f115, %f544, %f190;
	fma.rn.ftz.f32 	%f547, %f115, %f335, %f334;
	@%p31 bra 	BB4_78;

	setp.ltu.ftz.f32	%p39, %f547, 0f00000000;
	@%p39 bra 	BB4_71;
	bra.uni 	BB4_70;

BB4_71:
	neg.ftz.f32 	%f338, %f547;
	lg2.approx.ftz.f32 	%f339, %f338;
	mul.ftz.f32 	%f340, %f339, 0f3ED55555;
	ex2.approx.ftz.f32 	%f341, %f340;
	neg.ftz.f32 	%f547, %f341;
	bra.uni 	BB4_72;

BB4_78:
	ld.volatile.shared.f32 	%f364, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f365, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f366, %f114, %f365;
	fma.rn.ftz.f32 	%f367, %f113, %f364, %f366;
	ld.volatile.shared.f32 	%f368, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f548, %f115, %f368, %f367;
	ld.volatile.shared.f32 	%f369, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f370, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f371, %f114, %f370;
	fma.rn.ftz.f32 	%f372, %f113, %f369, %f371;
	ld.volatile.shared.f32 	%f373, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f549, %f115, %f373, %f372;
	bra.uni 	BB4_79;

BB4_70:
	lg2.approx.ftz.f32 	%f336, %f547;
	mul.ftz.f32 	%f337, %f336, 0f3ED55555;
	ex2.approx.ftz.f32 	%f547, %f337;

BB4_72:
	ld.volatile.shared.f32 	%f342, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f343, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f344, %f114, %f343;
	fma.rn.ftz.f32 	%f345, %f113, %f342, %f344;
	ld.volatile.shared.f32 	%f346, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f120, %f115, %f346, %f345;
	setp.ltu.ftz.f32	%p40, %f120, 0f00000000;
	@%p40 bra 	BB4_74;
	bra.uni 	BB4_73;

BB4_74:
	neg.ftz.f32 	%f349, %f120;
	lg2.approx.ftz.f32 	%f350, %f349;
	mul.ftz.f32 	%f351, %f350, 0f3ED55555;
	ex2.approx.ftz.f32 	%f352, %f351;
	neg.ftz.f32 	%f548, %f352;
	bra.uni 	BB4_75;

BB4_73:
	lg2.approx.ftz.f32 	%f347, %f120;
	mul.ftz.f32 	%f348, %f347, 0f3ED55555;
	ex2.approx.ftz.f32 	%f548, %f348;

BB4_75:
	ld.volatile.shared.f32 	%f353, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f354, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f355, %f114, %f354;
	fma.rn.ftz.f32 	%f356, %f113, %f353, %f355;
	ld.volatile.shared.f32 	%f357, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f124, %f115, %f357, %f356;
	setp.ltu.ftz.f32	%p41, %f124, 0f00000000;
	@%p41 bra 	BB4_77;
	bra.uni 	BB4_76;

BB4_77:
	neg.ftz.f32 	%f360, %f124;
	lg2.approx.ftz.f32 	%f361, %f360;
	mul.ftz.f32 	%f362, %f361, 0f3ED55555;
	ex2.approx.ftz.f32 	%f363, %f362;
	neg.ftz.f32 	%f549, %f363;
	bra.uni 	BB4_79;

BB4_76:
	lg2.approx.ftz.f32 	%f358, %f124;
	mul.ftz.f32 	%f359, %f358, 0f3ED55555;
	ex2.approx.ftz.f32 	%f549, %f359;

BB4_79:
	setp.ltu.ftz.f32	%p42, %f59, 0f00000000;
	@%p42 bra 	BB4_81;
	bra.uni 	BB4_80;

BB4_81:
	neg.ftz.f32 	%f376, %f59;
	lg2.approx.ftz.f32 	%f377, %f376;
	mul.ftz.f32 	%f378, %f377, 0f4019999A;
	ex2.approx.ftz.f32 	%f379, %f378;
	neg.ftz.f32 	%f550, %f379;
	bra.uni 	BB4_82;

BB4_80:
	lg2.approx.ftz.f32 	%f374, %f59;
	mul.ftz.f32 	%f375, %f374, 0f4019999A;
	ex2.approx.ftz.f32 	%f550, %f375;

BB4_82:
	setp.ltu.ftz.f32	%p43, %f521, 0f00000000;
	@%p43 bra 	BB4_84;
	bra.uni 	BB4_83;

BB4_84:
	neg.ftz.f32 	%f382, %f521;
	lg2.approx.ftz.f32 	%f383, %f382;
	mul.ftz.f32 	%f384, %f383, 0f4019999A;
	ex2.approx.ftz.f32 	%f385, %f384;
	neg.ftz.f32 	%f551, %f385;
	bra.uni 	BB4_85;

BB4_83:
	lg2.approx.ftz.f32 	%f380, %f521;
	mul.ftz.f32 	%f381, %f380, 0f4019999A;
	ex2.approx.ftz.f32 	%f551, %f381;

BB4_85:
	setp.ltu.ftz.f32	%p44, %f72, 0f00000000;
	@%p44 bra 	BB4_87;
	bra.uni 	BB4_86;

BB4_87:
	neg.ftz.f32 	%f388, %f72;
	lg2.approx.ftz.f32 	%f389, %f388;
	mul.ftz.f32 	%f390, %f389, 0f4019999A;
	ex2.approx.ftz.f32 	%f391, %f390;
	neg.ftz.f32 	%f552, %f391;
	bra.uni 	BB4_88;

BB4_86:
	lg2.approx.ftz.f32 	%f386, %f72;
	mul.ftz.f32 	%f387, %f386, 0f4019999A;
	ex2.approx.ftz.f32 	%f552, %f387;

BB4_88:
	ld.volatile.shared.f32 	%f392, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+24];
	min.ftz.f32 	%f141, %f550, %f188;
	ld.volatile.shared.f32 	%f393, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+28];
	min.ftz.f32 	%f142, %f551, %f189;
	mul.ftz.f32 	%f394, %f142, %f393;
	fma.rn.ftz.f32 	%f395, %f141, %f392, %f394;
	ld.volatile.shared.f32 	%f396, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+32];
	min.ftz.f32 	%f143, %f552, %f190;
	fma.rn.ftz.f32 	%f555, %f143, %f396, %f395;
	@%p31 bra 	BB4_98;

	setp.ltu.ftz.f32	%p46, %f555, 0f00000000;
	@%p46 bra 	BB4_91;
	bra.uni 	BB4_90;

BB4_91:
	neg.ftz.f32 	%f399, %f555;
	lg2.approx.ftz.f32 	%f400, %f399;
	mul.ftz.f32 	%f401, %f400, 0f3ED55555;
	ex2.approx.ftz.f32 	%f402, %f401;
	neg.ftz.f32 	%f555, %f402;
	bra.uni 	BB4_92;

BB4_98:
	ld.volatile.shared.f32 	%f425, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f426, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f427, %f142, %f426;
	fma.rn.ftz.f32 	%f428, %f141, %f425, %f427;
	ld.volatile.shared.f32 	%f429, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f556, %f143, %f429, %f428;
	ld.volatile.shared.f32 	%f430, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f431, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f432, %f142, %f431;
	fma.rn.ftz.f32 	%f433, %f141, %f430, %f432;
	ld.volatile.shared.f32 	%f434, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f557, %f143, %f434, %f433;
	bra.uni 	BB4_99;

BB4_90:
	lg2.approx.ftz.f32 	%f397, %f555;
	mul.ftz.f32 	%f398, %f397, 0f3ED55555;
	ex2.approx.ftz.f32 	%f555, %f398;

BB4_92:
	ld.volatile.shared.f32 	%f403, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f404, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f405, %f142, %f404;
	fma.rn.ftz.f32 	%f406, %f141, %f403, %f405;
	ld.volatile.shared.f32 	%f407, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f148, %f143, %f407, %f406;
	setp.ltu.ftz.f32	%p47, %f148, 0f00000000;
	@%p47 bra 	BB4_94;
	bra.uni 	BB4_93;

BB4_94:
	neg.ftz.f32 	%f410, %f148;
	lg2.approx.ftz.f32 	%f411, %f410;
	mul.ftz.f32 	%f412, %f411, 0f3ED55555;
	ex2.approx.ftz.f32 	%f413, %f412;
	neg.ftz.f32 	%f556, %f413;
	bra.uni 	BB4_95;

BB4_93:
	lg2.approx.ftz.f32 	%f408, %f148;
	mul.ftz.f32 	%f409, %f408, 0f3ED55555;
	ex2.approx.ftz.f32 	%f556, %f409;

BB4_95:
	ld.volatile.shared.f32 	%f414, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f415, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f416, %f142, %f415;
	fma.rn.ftz.f32 	%f417, %f141, %f414, %f416;
	ld.volatile.shared.f32 	%f418, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f152, %f143, %f418, %f417;
	setp.ltu.ftz.f32	%p48, %f152, 0f00000000;
	@%p48 bra 	BB4_97;
	bra.uni 	BB4_96;

BB4_97:
	neg.ftz.f32 	%f421, %f152;
	lg2.approx.ftz.f32 	%f422, %f421;
	mul.ftz.f32 	%f423, %f422, 0f3ED55555;
	ex2.approx.ftz.f32 	%f424, %f423;
	neg.ftz.f32 	%f557, %f424;
	bra.uni 	BB4_99;

BB4_96:
	lg2.approx.ftz.f32 	%f419, %f152;
	mul.ftz.f32 	%f420, %f419, 0f3ED55555;
	ex2.approx.ftz.f32 	%f557, %f420;

BB4_99:
	setp.ltu.ftz.f32	%p49, %f60, 0f00000000;
	@%p49 bra 	BB4_101;
	bra.uni 	BB4_100;

BB4_101:
	neg.ftz.f32 	%f437, %f60;
	lg2.approx.ftz.f32 	%f438, %f437;
	mul.ftz.f32 	%f439, %f438, 0f4019999A;
	ex2.approx.ftz.f32 	%f440, %f439;
	neg.ftz.f32 	%f558, %f440;
	bra.uni 	BB4_102;

BB4_100:
	lg2.approx.ftz.f32 	%f435, %f60;
	mul.ftz.f32 	%f436, %f435, 0f4019999A;
	ex2.approx.ftz.f32 	%f558, %f436;

BB4_102:
	setp.ltu.ftz.f32	%p50, %f525, 0f00000000;
	@%p50 bra 	BB4_104;
	bra.uni 	BB4_103;

BB4_104:
	neg.ftz.f32 	%f443, %f525;
	lg2.approx.ftz.f32 	%f444, %f443;
	mul.ftz.f32 	%f445, %f444, 0f4019999A;
	ex2.approx.ftz.f32 	%f446, %f445;
	neg.ftz.f32 	%f559, %f446;
	bra.uni 	BB4_105;

BB4_103:
	lg2.approx.ftz.f32 	%f441, %f525;
	mul.ftz.f32 	%f442, %f441, 0f4019999A;
	ex2.approx.ftz.f32 	%f559, %f442;

BB4_105:
	setp.ltu.ftz.f32	%p51, %f524, 0f00000000;
	@%p51 bra 	BB4_107;
	bra.uni 	BB4_106;

BB4_107:
	neg.ftz.f32 	%f449, %f524;
	lg2.approx.ftz.f32 	%f450, %f449;
	mul.ftz.f32 	%f451, %f450, 0f4019999A;
	ex2.approx.ftz.f32 	%f452, %f451;
	neg.ftz.f32 	%f560, %f452;
	bra.uni 	BB4_108;

BB4_106:
	lg2.approx.ftz.f32 	%f447, %f524;
	mul.ftz.f32 	%f448, %f447, 0f4019999A;
	ex2.approx.ftz.f32 	%f560, %f448;

BB4_108:
	ld.volatile.shared.f32 	%f453, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+24];
	min.ftz.f32 	%f169, %f558, %f188;
	ld.volatile.shared.f32 	%f454, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+28];
	min.ftz.f32 	%f170, %f559, %f189;
	mul.ftz.f32 	%f455, %f170, %f454;
	fma.rn.ftz.f32 	%f456, %f169, %f453, %f455;
	ld.volatile.shared.f32 	%f457, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+32];
	min.ftz.f32 	%f171, %f560, %f190;
	fma.rn.ftz.f32 	%f563, %f171, %f457, %f456;
	@%p31 bra 	BB4_118;

	setp.ltu.ftz.f32	%p53, %f563, 0f00000000;
	@%p53 bra 	BB4_111;
	bra.uni 	BB4_110;

BB4_111:
	neg.ftz.f32 	%f460, %f563;
	lg2.approx.ftz.f32 	%f461, %f460;
	mul.ftz.f32 	%f462, %f461, 0f3ED55555;
	ex2.approx.ftz.f32 	%f463, %f462;
	neg.ftz.f32 	%f563, %f463;
	bra.uni 	BB4_112;

BB4_118:
	ld.volatile.shared.f32 	%f486, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f487, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f488, %f170, %f487;
	fma.rn.ftz.f32 	%f489, %f169, %f486, %f488;
	ld.volatile.shared.f32 	%f490, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f564, %f171, %f490, %f489;
	ld.volatile.shared.f32 	%f491, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f492, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f493, %f170, %f492;
	fma.rn.ftz.f32 	%f494, %f169, %f491, %f493;
	ld.volatile.shared.f32 	%f495, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f565, %f171, %f495, %f494;
	bra.uni 	BB4_119;

BB4_110:
	lg2.approx.ftz.f32 	%f458, %f563;
	mul.ftz.f32 	%f459, %f458, 0f3ED55555;
	ex2.approx.ftz.f32 	%f563, %f459;

BB4_112:
	ld.volatile.shared.f32 	%f464, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+12];
	ld.volatile.shared.f32 	%f465, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+16];
	mul.ftz.f32 	%f466, %f170, %f465;
	fma.rn.ftz.f32 	%f467, %f169, %f464, %f466;
	ld.volatile.shared.f32 	%f468, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+20];
	fma.rn.ftz.f32 	%f176, %f171, %f468, %f467;
	setp.ltu.ftz.f32	%p54, %f176, 0f00000000;
	@%p54 bra 	BB4_114;
	bra.uni 	BB4_113;

BB4_114:
	neg.ftz.f32 	%f471, %f176;
	lg2.approx.ftz.f32 	%f472, %f471;
	mul.ftz.f32 	%f473, %f472, 0f3ED55555;
	ex2.approx.ftz.f32 	%f474, %f473;
	neg.ftz.f32 	%f564, %f474;
	bra.uni 	BB4_115;

BB4_113:
	lg2.approx.ftz.f32 	%f469, %f176;
	mul.ftz.f32 	%f470, %f469, 0f3ED55555;
	ex2.approx.ftz.f32 	%f564, %f470;

BB4_115:
	ld.volatile.shared.f32 	%f475, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix];
	ld.volatile.shared.f32 	%f476, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+4];
	mul.ftz.f32 	%f477, %f170, %f476;
	fma.rn.ftz.f32 	%f478, %f169, %f475, %f477;
	ld.volatile.shared.f32 	%f479, [_ZZ69PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_KernelE6matrix+8];
	fma.rn.ftz.f32 	%f180, %f171, %f479, %f478;
	setp.ltu.ftz.f32	%p55, %f180, 0f00000000;
	@%p55 bra 	BB4_117;
	bra.uni 	BB4_116;

BB4_117:
	neg.ftz.f32 	%f482, %f180;
	lg2.approx.ftz.f32 	%f483, %f482;
	mul.ftz.f32 	%f484, %f483, 0f3ED55555;
	ex2.approx.ftz.f32 	%f485, %f484;
	neg.ftz.f32 	%f565, %f485;
	bra.uni 	BB4_119;

BB4_116:
	lg2.approx.ftz.f32 	%f480, %f180;
	mul.ftz.f32 	%f481, %f480, 0f3ED55555;
	ex2.approx.ftz.f32 	%f565, %f481;

BB4_119:
	add.s32 	%r171, %r21, -1;
	sub.s32 	%r172, %r171, %r4;
	setp.eq.s32	%p56, %r18, 0;
	selp.b32	%r173, %r4, %r172, %p56;
	mul.lo.s32 	%r11, %r173, %r17;
	add.s32 	%r12, %r11, %r3;
	@%p8 bra 	BB4_121;

	cvta.to.global.u64 	%rd74, %rd6;
	mul.wide.s32 	%rd75, %r12, 16;
	add.s64 	%rd76, %rd74, %rd75;
	st.global.v4.f32 	[%rd76], {%f539, %f540, %f541, %f515};
	bra.uni 	BB4_122;

BB4_121:
	cvta.to.global.u64 	%rd77, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs23, %f539;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs24, %f540;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs25, %f541;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs26, %f515;}

	// inline asm
	mul.wide.s32 	%rd78, %r12, 8;
	add.s64 	%rd79, %rd77, %rd78;
	st.global.u16 	[%rd79], %rs23;
	st.global.u16 	[%rd79+2], %rs24;
	st.global.u16 	[%rd79+4], %rs25;
	st.global.u16 	[%rd79+6], %rs26;

BB4_122:
	add.s32 	%r184, %r3, %r11;
	add.s32 	%r13, %r184, 1;
	@%p8 bra 	BB4_124;

	cvta.to.global.u64 	%rd80, %rd6;
	mul.wide.s32 	%rd81, %r13, 16;
	add.s64 	%rd82, %rd80, %rd81;
	st.global.v4.f32 	[%rd82], {%f547, %f548, %f549, %f519};
	bra.uni 	BB4_125;

BB4_124:
	cvta.to.global.u64 	%rd83, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs27, %f547;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs28, %f548;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs29, %f549;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs30, %f519;}

	// inline asm
	mul.wide.s32 	%rd84, %r13, 8;
	add.s64 	%rd85, %rd83, %rd84;
	st.global.u16 	[%rd85], %rs27;
	st.global.u16 	[%rd85+2], %rs28;
	st.global.u16 	[%rd85+4], %rs29;
	st.global.u16 	[%rd85+6], %rs30;

BB4_125:
	selp.b32	%r193, 1, -1, %p56;
	add.s32 	%r194, %r173, %r193;
	mul.lo.s32 	%r14, %r194, %r17;
	add.s32 	%r15, %r14, %r3;
	@%p8 bra 	BB4_127;

	cvta.to.global.u64 	%rd86, %rd6;
	mul.wide.s32 	%rd87, %r15, 16;
	add.s64 	%rd88, %rd86, %rd87;
	st.global.v4.f32 	[%rd88], {%f555, %f556, %f557, %f523};
	bra.uni 	BB4_128;

BB4_127:
	cvta.to.global.u64 	%rd89, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs31, %f555;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs32, %f556;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs33, %f557;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs34, %f523;}

	// inline asm
	mul.wide.s32 	%rd90, %r15, 8;
	add.s64 	%rd91, %rd89, %rd90;
	st.global.u16 	[%rd91], %rs31;
	st.global.u16 	[%rd91+2], %rs32;
	st.global.u16 	[%rd91+4], %rs33;
	st.global.u16 	[%rd91+6], %rs34;

BB4_128:
	add.s32 	%r205, %r3, %r14;
	add.s32 	%r16, %r205, 1;
	@%p8 bra 	BB4_130;

	cvta.to.global.u64 	%rd92, %rd6;
	mul.wide.s32 	%rd93, %r16, 16;
	add.s64 	%rd94, %rd92, %rd93;
	st.global.v4.f32 	[%rd94], {%f563, %f564, %f565, %f527};
	bra.uni 	BB4_131;

BB4_130:
	cvta.to.global.u64 	%rd95, %rd6;
	// inline asm
	{  cvt.rn.f16.f32 %rs35, %f563;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs36, %f564;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs37, %f565;}

	// inline asm
	// inline asm
	{  cvt.rn.f16.f32 %rs38, %f527;}

	// inline asm
	mul.wide.s32 	%rd96, %r16, 8;
	add.s64 	%rd97, %rd95, %rd96;
	st.global.u16 	[%rd97], %rs35;
	st.global.u16 	[%rd97+2], %rs36;
	st.global.u16 	[%rd97+4], %rs37;
	st.global.u16 	[%rd97+6], %rs38;

BB4_131:
	ret;
}


  ELF3                    @             V @ 8  @    .shstrtab .strtab .symtab .symtab_shndx .nv.info .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.constant3 .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .debug_frame .rel.debug_frame .rela.debug_frame .nv.callgraph .nv.pr
ototype .nv.rel.action  .shstrtab .strtab .symtab .symtab_shndx .nv.info .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.constant3 kRGB32f_To_601YPbPr k601YPbPr_To_RGB32f kRGB32f_To_601YCbCr k601YCbCr_To_RGB32f kRGB8u_To_601YCbCr k601YCbCr_To_RGB8u kRGB8u_To_601YCbCrFullRange k601YCbCrFullRange_To_RGB8u kRGB32f_To_601YCbCrFullRange k601YCbCrFullRange_To_RGB32f kRGB32f_To_709YPbPr k709YPbPr_To_RGB32f kRGB32f_To_709YCbCr k709YCbCr_To_RGB32f k709YCbCrFullRange_To_RGB32f kRGB8u_To_709YCbCr k709YCbCr_To_RGB8u k709YCbCr_To_601YCbCr k601YCbCr_To_709YCbCr kZeroMatrix kYCbCrOffset kYCbCrFullRangeOffset PQ_m1 PQ_m1Inv PQ_m2 PQ_m2Inv PQ_c1 PQ_c2 PQ_c3 Gamma1886 PQ_Lpeak PQ_a PQ_b PQ_c PQ_s PQ_g scaleFD HLG_a HLG_b HLG_c HLG_inva HLG_alpha HLG_invAlpha HLG_gamma HLG_gammaM1 HLG_gammaM1Dgamma HLG_YR HLG_YG HLG_YB HLG_Lpeak kRandMax .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .nv.info.PixelFormatConvert_Bay
er_To_BGRA_4444_32f_Nearest_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel .text.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .nv.info.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .nv.shared.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .rel.nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .nv.constant0.PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel .debug_frame .rel.debug_frame .rela.debug_frame .nv.callgraph .nv.prototype .nv.rel.action PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Chroma_Tweak_Kernel PixelFormatConvert_Bayer_To_BGRA_4444_32f_Lumetri_Green_Kernel PixelFormatConvert_Bayer_To_BGRA_4444_32f_Linear_Kernel PixelFormatConvert_Bayer_To_BGRA_4444_32f_Nearest_Kernel PixelFormatConvert_Bayer_To_BGRA_4444_32f_Bayered_Kernel                              2                                                              ,            $       @    $       $       T    H       $       h    l       $       |           $                  $                  $                  $                  $           D      $           h      $       (          $       <          $       P          $       d          $                 $           @      $           d      $                 $                 $                                                                                                                               &                 ,                  2                 <                 E                 J                 O                 T                 Y                 ^     
             f    $             l    (             r    ,             x    0                 4                 8                 <                 @                 D                 H                 L                 P                 T                 X             @                                                            	                                                            [                                        k                                        3	                    	                    	
                    9
                    U
                    d
           '      
                 
                 !                  Z                  $        |( ((   4                       '         <   ( l	         $        |( ((   4       p                        ,   ( @         $        |( ((   4                               <   (           $        |( ((   4       P                        <   (          $        |( ((   4                               <   ( <         / J       J       / I       I       / H       H       / G   "    G       / F   (    F        F        G        H        I        J       7    5  
 7   `H H       D        
 @        	 0  A       ,         (         $                                       !         !           !      &  &       7    5  
 9   `8 8       4        
 0        	 ,         (         $                                                         !           !               7    5  
 <   `X X       T         P         @  A       4        
 0        	 ,         (         $                                                         !           !              7    5  
 ?   `X X       T         P         @  A       4        
 0        	 ,         (         $                                                         !           !     P         7    5  
 B   `X X       T         P         @  A       4        
 0        	 ,         (         $                                                         !           !     0                             s          % 6         J            I   $         H             G   D          F   >E?x=!,o   ?   ?F^־膦  ?    t?  ?26  ??    FB C^A!0g  B  BoF%;    ;%;(ɺP%;<    y>?=>>NG
?    J?
?ȾP
?N@    >E?x=,'>>+վ;ߥ  ?    H?  ?6  ??    q}B\C\Ao+1H  B  BX9;    t;;26;;    гY>Y7?ݓ=Vž   ?   ?;  ?    ?  ??  ?M?    j<:BC|AO  B  BuQ$%;    ^;%;!9[%;R<    ;    ;;=?ﺃ;R;    :>5>?}=νY>>B̾$
?    x?
?5^Zl
?1@      ?d=MD>    g}?
    =b{?  ?z콳T    b?ؼ=    J==?                                      A   C   C       C   C  #>k@ BO<  V? ЖA A@ @F?VnB39Cff>  B7> >OV?)@   A=?L>*>>h-?r=  zD                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                               
                                                                                                                                                                                                                                                                                                                                                                                                                               z  
       y      !   " z  F   
    Ey  `      y      "   h y      &    y       %    x    p@  r    pVr  / $z    O $z      Ə x       x       z  b  pb  z  a  pfp  G        z  c  pR  z  h       r      x?     x       x	        x       z  h    z	  h  	 x         z  h    |
   	  z \    |    D  %v \    z	 \    z ]  
  z		 ]      y     y      y     " $x     s         s       A s       Ay          {           M	          z  `  pR  $z# ^    x          %v# X              	     b #     %# X             	    b x!               " % X             "    " $z!! ^    $    " %! X         " %! X    	     ( 
    (     h %    (       h      hE     h     b 	! 0    A    !     0    A            % X    0"    A         b 0$    A    "     $         b 0    A    0
    A    %	 X     	     b z  a       x?  |    pb  0%    A    Ey         0	"    A   O r"         0
$    A   ̏ G  `       #    / 	"$    b          % X         0"    A   O Ay         ? z  b       Ey        x?  x    pb  x    pb  r 	       |    pb  r$         |    pf	  G9         x              $z ^    % X    % X          	$    b 0$    A   O Ay          Ey         GI         x              $z ^    x     % X    % X          	    b 0    A   O Ay          x    p  !r"        x  Ey         #x      !r$       $z" ^    !r$        !r        !r$        r 	        #x       x"  !r        %v X     G9  P                	    h % X         0    A   O Ay          Ey         r         G  `       "     	$    b          % X         0    A   O Ay          #x$  	    Ey         0     A    r     `  !r

        r     `  r          G  p       x!           % X     % X    	     j      0     A   O Ay          !r               " !$      !#      !r         0    A    0    A    !r	        3        b 0    A    #x!      0    A    0    A    !r"!         $         @  A   y        0    A    r "    `  y       $  #       "  8@  A  / y        l 3         !$"     O  #@  A  ̏ $ $         @  A  #% "        # #       " !r"	       O #x"       !        "  (%%@  A   !r                  $@  A  O !#     	z e      # %        !r 	                 !!      z  i  pR  #x!       	z d       r     A   !r!        #r       !     O 	z f      #r      / G        y        r     `  y       ( y       h y         #         y        y       "  (UU>  A  O #          r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !      3        b  UU>  A           $ !      C          8UU>  A  /         b  UU>  A    HUU>  A  O         "  UU>  A  / 3                 b !      C                 " !     / !      Gy         y        y       ( y       h y         y        y         r     A   #r       #r      /  r     A  O #r       #r       r     ` y        r     `  r     `  y       ( y        h !      3         !      !               #        "  8@  A  O           @  A  Ώ           (@  A  C        0 3          @  A  O  @  A  ̏           H@  A  #                  !
     O 	z e      C          r     A           " !     ʏ 	z d      #r       !      	z f      #r      / G        y        r     `  y       ( y       h y         #         y        y       "  (UU>  A  O #          r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !     O 3        b  UU>  A           $ !      C          8UU>  A  /         b  UU>  A    HUU>  A  O         "  UU>  A  / 3                 b !      C                 " !     / !      Gy         y        y       ( y        y         y       h y         r     A   #r        r     A  / #r       #r       #r      O r     ` y        r     `  r     `  y       ( y        h !      3         !      !               #        "  8@  A  O           @  A  Ώ           (@  A  C        0 3          @  A  O  @  A  ̏           H@  A  #                  !     O 	z e      C          r     A           " !     ʏ 	z d      #r       !      	z f      #r      / G        y        r     `  y       ( y       h y         #         y        y       "  (UU>  A  O #          r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !     O 3        b  UU>  A           $ !      C          8UU>  A  /         b  UU>  A    HUU>  A  O         "  UU>  A  / 3                 b !      C                 " !     / !      Gy         y 
       y       ( y        y         y       h y         r     A   #r        r     A  / #r       #r       #r      O r 	    ` y        r 
    `  r     `  y       ( y        h !	      3 	        !
      !               # 
       "  8@  A  O           @  A  Ώ           (@  A  C        0 3	          @  A  O  @  A  ̏           H@  A  #                  !	     O 	z	 e      C
          r     A           " !     ʏ 	z	 d      #r	       !
      	z

 f      #r
      / G        y        r     `  y       ( y       h y                  y        y       "  UU>  A  O           r     A   #r	       !      #r
      /  r     A  ȏ r     `          " #r	       #r
      r     `  !     O #	        b  UU>  A           $ !      3
          (	UU>  A  /         b  UU>  A    8
UU>  A  O         "  UU>  A  / #	                 b !      3
                 " !	     / !
      Gy         y        y       ( y        y         y       h y         r     A   #r	        r     A  / #r	       #r	
       #r

      O x         z  _  pR  z b    r       x    $z ^     % Z    x     $z ^   	      $z ^    % Z     G	         x         >r        >r        %v Z    x2v       x2v       y      y     y     y     	      x     % Z     G	         x        / >r        >r        %v Z    x2v       x2v       y      y     y     y     	      % Z    ? G	         x         >r       O >r        %v Z    x 2v        x2v       y      y      y     y     	      M	          x         >r	       / >r

        %v Z    x 2v        x
2v      O y      y      y 
    y     My          Gy    y            y            y            y            y            y            y            y            y            y            y            z  
       y      &   ( y      "   ( y       %   h y      !   b $z     x       $z       / z  c  pb  x        z  b  pfp   M	          z
  c       x
     x
?  z  ^       z  \   
    r	?   ?  r ?   pR  r	   ?  r	        x?     r?        r?        $|
    r   ?  $|     z  F   
    r   ?  |    |     |     z X    |     z Y     z X    y     z Y     y      y     ( y    b x     pb  z  b       Ey        r     ` O r     `  r     ` !      r     `          !              " !      #        p  3	          UU>  A   C        0                  "  UU>  A   !       (UU>  A  /  8		UU>  A  O  HUU>  A             UU>  A  Ώ         "  UU>  A          p #         !      3	 	       0 C                 0         "  UU>  A  / r         G         y    r      ` O !                p           UU>  A  /           UU>  A  O         d !     / Ay          x?          b !      Ey         |    pb  r         G         y     . r      ` O !       C         0         b  HUU>  A   C          UU>  A  /         $ !      Ay         / x?  Ey         !     !	      r         |    pb  GI         y     r     ` O !       #        0           b  (UU>  A   #           UU>  A  /         $ !      Ay          x    pb  x
?  x   Ey  0      x    pb  x    pb  $|      x    px  |    pb  x  r         G         y    r      ` O !       #         0         b  (UU>  A   #          UU>  A  /         $ !      Ay          Ey         |     r  	        G         y   r     ` O !               0         b   UU>  A              UU>  A  /         $ !       Ay          Ey         |    pf  r         G         y     r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          Ey        |   	  r         r         GI         z X    z Y     y      r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          Ey         G         |     |     z X    z Y     y      r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          Ey         r         G         z X    z Y     y     r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          Ey  `      r        r        r 	        r         G         x  $|     |     |     z X    z Y     y      r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          Ey         G9         x     $|     |     |     z X    z Y     y      r     ` O !              0         b  UU>  A             UU>  A  /         $ !     
 Ay          Ey  0      G9        x     $|     x     |     |     z X    z Y     y      r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          Ey  0      G	        x     $|     x     |     |     z X    z Y     y     r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          x
?  Ey  P      r         |    pb  G	        x     $|     x     |     |     z X    z Y     y      r     ` O !              0         b  UU>  A             UU>  A  /         $ !      Ay          !r         $z `    !r      !r       !r        !r      r     !r       !r	        !r        !r      !r        !r        $z
 `    !r        !r
       !r 	       !r        !r       !r
  @    !r
  @    !r	        !r        !r       !r        !r        !r
       !r        !r
        !r        !r       !r      !r         x  >  A   !r        xL<  A   !r  	         x  >  A   z  a  pR  !r  @    #x   ?    !r         x  >  A   !r        !r	       #x    ?    r       !r 	        !r        #x   ?    !r  @   !r         x  >  A   !r        !r       !r        #x     ?    !r       r       !r       H          x   ?  A            x  >  A   H   ?     %F Z    !r
         xL<  A   H         !r        I      x     !r        r       !r        r       %F Z    H   ?      x   ?  A    x

   ?  A   GI         x         >r        x  <       %v Z    >r        x2v       xv       y      y     y     y     I      GI         x         >r	       / >r

        %v Z    x  <       x2v       y      y     y 
    y     H         !r        H   ?      x   ?  A   !r         %F Z     x   ?  A   H          x   ?  A   x    /  x  >  A   I      2         H   ?     %F Z    GI         x         >r        >r        %v Z    x   <       x2v       y      y     y     y      I      MI          x         >r       / >r        %v Z    x   <       x2v       y      y     y     y      My          Gy    y            y            y            y            y            y            y            y            y            y            z  
       y      !   " z  F   
    Ey  `      y       "   h y      &    y      %    x    p@  r     pVr  / $z     O $z     Ə x       x       z  d  pb  z  c  pfp  G        z  e  pR  z  l       r      x?     x       x	        x       z  l    z
  l  	 x         z  l    |	   D z X    |   	  %v X    z
 X    z	 Y  	   z
 Y    y     y      y     " $x     s         s       A s       Ay          {           M	          z
  d       x     x
?  y        z  ^       z  \   
    y       " r ?   pR  r	?   ?  r	   ?  r	        x?     r?        r?        $|     r   ?  $|     r   ?  |     |     |       z X    |     z X   z Y      z Y     y     y	      y     " r    pR  x  y     ( $|     
    x      r    pR  |     

 X    |   	  

 Y    r    p&  z X    z Y    r        O r 	       ȏ    r         	r         	      r                	        x
?  x     |    pb  $|     z  c       x    / x?  |         |
   	        X   |    pb   Y    y        b r 	        r         |    pfr      b z X        b	 r         r        z Y  
  r
         z  m  pR       h     h 
     d 	z h      !r       O !r       ȏ !r	        !r        x  >  A   !r        	z i      !r          x  >  A    r     A   	z j      #r       #r      / G        y        r     `  y       ( y       h y                  y        y       "  UU>  A  O           r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !     O #        b  UU>  A           $ !      3          (UU>  A  /         b  UU>  A    8UU>  A  O         "  UU>  A  / #                 b !      3                 " !     / !      Gy         y        y       ( y        y         y       h y         r     A   r     A  / #r      #r       #r      #r      O z  a  pR  y        z  b  pR  !r       !r         y       " 	z i       x   ?  A    x   ?  A   y        f 	z h           (         (   ?     $z `    	z j      %& Z    )       r     A   #r       G)         x        o >r        >r        %v Z    x  <       xv       x2v       y      xv       y     y     y     #r       G        y        r     `  y       ( y       h y         3         y        y       "  8UU>  A  O 3          r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !      C        b  UU>  A           $ !      S          HUU>  A  /         b  UU>  A    XUU>  A  O         "  UU>  A  / C                 b !      S                 " !     / !     
 Gy         y        y       ( y       h y         y        y         r     A   #r       #r      /  r     A  O #r       #r       y        x     !r
        (         y       " (   ?     !r          x   ?  A   y        b %& Z    	z	 i       x   ?  A   	z h      )      	z j       r     A   #r       G)         x        o >r        >r        %v Z    x  <       xv       x2v       y      xv       y     y     y     #r       G        y        r     `  y       ( y       h y         3         y        y       "  8UU>  A  O 3          r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !      C        b  UU>  A           $ !      S          HUU>  A  /         b  UU>  A    XUU>  A  O         "  UU>  A  / C                 b !      S                 " !     / !      Gy         y        y       ( y       h y         y        y         r     A   #r       #r      /  r     A  O #r       #r       y        !r	        x	     !r
        y       " !r        	  !r        y        b !r        (         $z	 `    (   ?      x  >  A    x  >  A   %&
 Z    	z   j      	z i      ) 
     	z h       r     A   #r       G)         x        o >r        >r        %v Z    x
  <       xv       x2v       y      x
v       y     y     y     #r        G        y        r     `  y
       ( y       h y                  y        y       "  UU>  A  O           r
     A   #r       !      #r       /  r     A  ȏ r     `          " #r       #r       r     `  !               b  UU>  A             $ !
      3          UU>  A  / 
 
       b   UU>  A    8UU>  A  O         "  
UU>  A  /                  b !      3                 " !     / !      Gy         y        y       ( y
       h y         y        y         r     A   #r       #r 
      /  r     A  O #r       #r        $z	 `    (         (   ?     x      %&  Z    )      M)          x         >r        x  <       %v  Z    >r        x2v       x v        y      y     y     y      My          Gy    y            y            y            y            y            y            y            y            y            y            y            y            y            y            z  
       y      !   " z
  F   
    Ey  `      y      "   h y      &    y       %    x    p@  r    pVr  / $z    O $z       Ə x       x         z  d  pb  z   c  pfp  G        z  e  pR  z  l       r     x?     x       x	        x      z l    z	 l  	 x         z l    |
   D  z X    |   	  %v X    z	 X    z Y  
   z		 Y    y
     y
      y
     " $x     s         s       A s       Ay          {           M	          z  d       x      x?  x     z  ^       y        z  \   
    r ?   pR  r	?   ?  r	   ?  r	        x?     r?        r?        $|    r   ?  $|      $|     r   ?  |	     |     |     z
	 X    |     z X    |     z	 Y     $|      z Y     |	   	  y


       z X    y
      z Y  	   |	     y
     " |     z	 X   y       & z	 Y     y        h y	
     b z  m  pR  	z

 i     O 	z h     Ə  r
     A   #r       	z j     #r      / G        y        r     `  y       ( y       h y                  y        y       "  UU>  A  O           r
     A   #r       !      #r      /  r
     A  ȏ r     `          " #r       #r      r     `  !      #        b  UU>  A           $ !      3          (UU>  A  /         b  UU>  A    8UU>  A  O         "  UU>  A  / #                 b !      3                 " !     / !      Gy         y        y       ( y       h y         y        y         r
     A   #r       #r      /  r
     A  O #r       #r       z  a  pR  y        z  b  pR  y       ( y        h      (         (   ?     $z `     %& Z    )    
   r
     A   #r       G)         x        o >r        >r        %v Z    x  <       xv       x2v       y    
  xv       y   
  y   
  y   
  #r       G        y        r     `  y       ( y       h y         3         y        y       "  8UU>  A  O 3          r
     A   #r       !      #r      /  r
     A  ȏ r     `          " #r       #r      r     `  !
      C        b  UU>  A   
 
       $ !      S          HUU>  A  /         b  
UU>  A    XUU>  A  O         "  UU>  A  / C                 b !      S                 " !     / !      Gy         y        y       ( y       h y         y        y         r
     A   #r       #r      /  r

     A  O #r   
    #r       y        x     (         y       " (   ?     	z		 i     y        b %&
 Z    ) 
   
   r	     A   #r       G)         x        o >r        >r        %v Z    x
  <       xv       x2v       y    
  x
v       y   
  y   
  y   
  #r       G        y        r     `  y       ( y
       h y         3         y        y       "  8UU>  A  O 3          r	     A   #r       !      #r

      /  r	     A  ȏ r 
    `          " #r       #r      r     `  !
      C 
       b  UU>  A           $ !      S          HUU>  A  /         b  
UU>  A    XUU>  A  O         "  UU>  A  / C         
 
       b !      S                 " !
     / !      Gy         y        y       ( y
       h y         y        y         r	     A   #r       #r
      /  r	     A  O #r       #r       y        x      y
       " (         (   ?     y        b $z `     %& Z    )    
   r	
     A   #r       G)         x        o >r        x
  <       %v Z    xv      x2v       >r        y    
  x
v       y   
  y   
  y   
  #r       G        y        r     `  y       ( y
       h y                  y        y       "  UU>  A  O           r	     A   #r       !      #r
      /  r		     A  ȏ r     `          " #r	   	    #r   	   r     `  !              b  UU>  A           $ !
      3          	UU>  A  / 
 
       b  UU>  A    8UU>  A  O         "  
UU>  A  /  	                b !      3                 " !     / !      Gy         y        y       ( y       h y         y
        y         r	     A   #r       #r      /  r
	
     A  O #r   
    #r       $z  `     (         (   ?     x       %&  Z    )    
  M)          x         >r        x  <       %v  Z    >r        x2v       x v        y    
  y   
  y   
  y    
  My          Gy    y            y            y            y            y            y            y            y            y            y            y            y            y            z  
       y      !   " z
  F   
    Ey  `      y      "   h y      &    y       %    x    p@  r    pVr  / $z    O $z       Ə x       x         z  d  pb  z   c  pfp  G        z  e  pR  z  l       r     x?     x       x	        x      z l    z	 l  	 x         z l    |
   D  z X    |   	  %v X    z	 X    z Y  
   z		 Y    y
     y
      y
     " $x     s         s       A s       Ay          {           M	          z  d       y	        z  ^       z  \   
    y       " x?  r	?   ?  y        b r ?   pR  r	   ?  r	        x?     r?        $|     r?        r   ?  r      r   ?  |     |     z X    z Y     y
      z  m  pR  z  a  pR  |      r     A  O 	z j      	z
 i     	z h       r
     A   #r	       r	        #r      / G        y        r     `  y       ( y       h y         #         y        y       "  (UU>  A  O #          r
     A   #r       !      #r      /  r
     A  ȏ r     `          " #r       #r      r     `  !     O 3
        b  UU>  A           $ !      C          8
UU>  A  /         b  
UU>  A    HUU>  A  O         "  UU>  A  / 3         
 
       b !      C                 " !
     / !      Gy         y        y       ( y       h y         y        y         r
     A   #r       #r      /  r

     A  O #r   
    #r       z  b  pR  $z	 `     x      r
     |
     (         (   ?     |
   	  %& Z    z
 X    )    
  z Y    G)         x         >r        >r        %v Z    x  <       xv       x2v       y    
  xv       y   
  y   
  y   
  y


      y        y       ( y        b  r
     A  O 	z
 i      	z h      r     A   	z j      #r       #r      / G        y        r     `  y       ( y       h y         3         y        y       "  8
UU>  A  O 3 
         r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !
     O C        b  UU>  A   
 
       $ !      S          HUU>  A  /         b  
UU>  A    XUU>  A  O         "  UU>  A  / C                 b !      S                 " !     / !      Gy         y        y
       ( y        y         y       h y         r

     A   r     A  / #r   
   #r       #r      #r      O (         $z	 `    (   ?     x     %& Z    $|     )    
  r
      |
     |
   	  z
 X    z Y    G)         x         >r        >r        %v Z    x  <       xv       x2v       y    
  xv       y   
  y   
  y   
  y


      y        y       ( y        b  r
     A  O 	z
 i      	z h      r     A   	z j      #r       #r      / G        y        r     `  y       ( y       h y         3         y        y       "  8
UU>  A  O 3 
         r     A   #r       !      #r      /  r     A  ȏ r     `          " #r       #r      r     `  !
     O C        b  UU>  A   
 
       $ !      S          HUU>  A  /         b  
UU>  A    XUU>  A  O         "  UU>  A  / C                 b !      S                 " !     / !      Gy         y        y
       ( y        y         y       h y         r

     A   r     A  / #r   
   #r       #r      #r      O r     y        x	     |     	  |   	  z X    $z  `     >
        z	 Y    (                  >        >        %  Z    x
v       (   ?     %&
  Z    x  <       xv       xv       ) 
   
      
     
     
     
  y
      y       h y          r      A  O 	z h      	z  i     	z  j       r     A  / #r       #r       G        y
        r     `  y       ( y	       h y                   y        y       "   UU>  A  O           r      A   #r
        !       #r		      /  r     A  ȏ r 	    `            " #r       #r      r     `  !	     O  	       b   UU>  A           $ !      3          
UU>  A  /         b   UU>  A    8UU>  A  O         "  	UU>  A  /  
                  b !      3         	 	       " !      / !	      Gy         y         y       ( y	        y
         y       h y         r     A   #r         r     A  / #r
       #r	       #r      O (	         $z  `    (   ?     %&  Z  	  )    
  M)          x         >r        x  <       %v  Z    >r        x2v       x v        y    
  y   
  y   
  y    
  My          Gy    y            y            y            y            y            y            y            y            y            y            y            y            y            y            y                                                                                                  @                                                                                                                                  F                 M                           0                             )      p                                                   ~      p@               l                                       p@               d                                       p@               \      (                                p@                      (                           5     p@               !      (                           }    p                "                                       p                "                                   Z  	   @               #      P                                               X#      \                             ,     B               &                                       B               \(                                       B               )                                  d     B               +                                       B               d-                                  2                    /      '         F  (                                    W               G  "               M                   u               H                                                     I                                                     J                       C                      $                                  C                      $                              
     C                      $                             w     C                      $                                   @                                                 X#                                                                                                  @                                           