A   Q      ,      `8$ҴAug 14 202405:08:24HOST64sm_86//
// Generated by NVIDIA NVVM Compiler
//
// Compiler Build ID: CL-31833905
// Cuda compilation tools, release 11.8, V11.8.89
// Based on NVVM 7.0.1
//

.version 7.8
.target sm_50
.address_size 64

	// .globl	GradientWipeKernel
// Module-scope constant-space data.
// Each 36-byte .b8 array below is declared with 4-byte alignment; the kernel in
// this file reads kRGB32f_To_601YPbPr with ld.const.f32 at byte offsets 0, 4
// and 8, i.e. as little-endian IEEE-754 f32 values. Its first three floats
// decode to approximately 0.299, 0.587 and 0.114.
// NOTE(review): 36 bytes = 9 f32, presumably a 3x3 matrix per table as the
// names suggest -- confirm against the original CUDA source. Apart from
// kRGB32f_To_601YPbPr, none of these symbols is referenced by
// GradientWipeKernel in the PTX visible here.
.const .align 4 .b8 kRGB32f_To_601YPbPr[36] = {135, 22, 153, 62, 162, 69, 22, 63, 213, 120, 233, 61, 33, 201, 44, 190, 111, 155, 169, 190, 0, 0, 0, 63, 0, 0, 0, 63, 70, 94, 214, 190, 232, 134, 166, 189};
.const .align 4 .b8 k601YPbPr_To_RGB32f[36] = {0, 0, 128, 63, 0, 0, 0, 0, 188, 116, 179, 63, 0, 0, 128, 63, 152, 50, 176, 190, 158, 209, 54, 191, 0, 0, 128, 63, 229, 208, 226, 63, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_601YCbCr[36] = {70, 246, 130, 66, 145, 141, 0, 67, 94, 186, 199, 65, 33, 48, 23, 194, 240, 103, 148, 194, 0, 0, 224, 66, 0, 0, 224, 66, 111, 146, 187, 194, 70, 182, 145, 193};
.const .align 4 .b8 k601YCbCr_To_RGB32f[36] = {37, 160, 149, 59, 0, 0, 0, 0, 182, 23, 205, 59, 37, 160, 149, 59, 40, 15, 201, 186, 156, 239, 80, 187, 37, 160, 149, 59, 236, 155, 1, 60, 0, 0, 0, 0};
.const .align 4 .b8 kRGB8u_To_601YCbCr[36] = {219, 121, 131, 62, 152, 14, 1, 63, 18, 131, 200, 61, 174, 199, 23, 190, 238, 252, 148, 190, 197, 224, 224, 62, 197, 224, 224, 62, 217, 78, 188, 190, 174, 71, 146, 189};
.const .align 4 .b8 k601YCbCr_To_RGB8u[36] = {127, 10, 149, 63, 0, 0, 0, 0, 160, 74, 204, 63, 127, 10, 149, 63, 254, 148, 200, 190, 184, 30, 80, 191, 127, 10, 149, 63, 78, 26, 1, 64, 0, 0, 0, 0};
.const .align 4 .b8 kRGB8u_To_601YCbCrFullRange[36] = {135, 22, 153, 62, 162, 69, 22, 63, 213, 120, 233, 61, 166, 27, 44, 190, 39, 241, 168, 190, 250, 254, 254, 62, 250, 254, 254, 62, 43, 135, 213, 190, 59, 223, 165, 189};
.const .align 4 .b8 k601YCbCrFullRange_To_RGB8u[36] = {0, 0, 128, 63, 0, 0, 0, 0, 72, 193, 178, 63, 0, 0, 128, 63, 143, 130, 175, 190, 225, 26, 54, 191, 0, 0, 128, 63, 20, 238, 225, 63, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_601YCbCrFullRange[36] = {113, 125, 152, 66, 92, 175, 21, 67, 92, 143, 232, 65, 158, 111, 43, 194, 49, 72, 168, 194, 0, 0, 254, 66, 0, 0, 254, 66, 170, 177, 212, 194, 88, 57, 165, 193};
.const .align 4 .b8 k601YCbCrFullRange_To_RGB32f[36] = {129, 128, 128, 59, 0, 0, 0, 0, 189, 116, 179, 59, 129, 128, 128, 59, 194, 50, 176, 186, 179, 209, 54, 187, 129, 128, 128, 59, 229, 208, 226, 59, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_709YPbPr[36] = {208, 179, 89, 62, 89, 23, 55, 63, 152, 221, 147, 61, 186, 164, 234, 189, 210, 86, 197, 190, 0, 0, 0, 63, 0, 0, 0, 63, 190, 134, 232, 190, 16, 202, 59, 189};
.const .align 4 .b8 k709YPbPr_To_RGB32f[36] = {0, 0, 128, 63, 0, 0, 0, 0, 12, 147, 201, 63, 0, 0, 128, 63, 221, 209, 63, 190, 243, 173, 239, 190, 0, 0, 128, 63, 77, 132, 237, 63, 0, 0, 0, 0};
.const .align 4 .b8 kRGB32f_To_709YCbCr[36] = {106, 60, 58, 66, 6, 161, 28, 67, 244, 253, 124, 65, 223, 79, 205, 193, 8, 172, 172, 194, 0, 0, 224, 66, 0, 0, 224, 66, 195, 117, 203, 194, 236, 81, 36, 193};
.const .align 4 .b8 k709YCbCr_To_RGB32f[36] = {37, 160, 149, 59, 0, 0, 0, 0, 239, 94, 230, 59, 37, 160, 149, 59, 33, 57, 91, 186, 178, 245, 8, 187, 37, 160, 149, 59, 82, 185, 7, 60, 0, 0, 0, 0};
.const .align 4 .b8 k709YCbCrFullRange_To_RGB32f[36] = {131, 128, 128, 59, 0, 0, 0, 0, 28, 147, 201, 59, 131, 128, 128, 59, 61, 210, 63, 186, 248, 173, 239, 186, 131, 128, 128, 59, 82, 132, 237, 59, 0, 0, 0, 0};
.const .align 4 .b8 kRGB8u_To_709YCbCr[36] = {207, 247, 58, 62, 53, 62, 29, 63, 231, 251, 125, 61, 184, 30, 206, 189, 23, 89, 173, 190, 197, 224, 224, 62, 197, 224, 224, 62, 12, 66, 204, 190, 195, 245, 36, 189};
.const .align 4 .b8 k709YCbCr_To_RGB8u[36] = {127, 10, 149, 63, 0, 0, 0, 0, 147, 120, 229, 63, 127, 10, 149, 63, 53, 94, 90, 190, 205, 108, 8, 191, 127, 10, 149, 63, 154, 49, 7, 64, 0, 0, 0, 0};
.const .align 4 .b8 k709YCbCr_To_601YCbCr[36] = {0, 0, 128, 63, 23, 100, 203, 61, 1, 77, 68, 62, 0, 0, 0, 0, 18, 103, 125, 63, 10, 158, 226, 189, 0, 0, 0, 0, 61, 98, 148, 189, 249, 191, 123, 63};
.const .align 4 .b8 k601YCbCr_To_709YCbCr[36] = {0, 0, 128, 63, 122, 165, 236, 189, 179, 237, 84, 190, 0, 0, 0, 0, 204, 98, 130, 63, 216, 188, 234, 61, 0, 0, 0, 0, 74, 179, 153, 61, 234, 61, 131, 63};
// Declared without an initializer.
.const .align 4 .b8 kZeroMatrix[36];
// 12-byte tables (3 x 4 bytes each).
.const .align 4 .b8 kYCbCrOffset[12] = {0, 0, 128, 65, 0, 0, 0, 67, 0, 0, 0, 67};
.const .align 4 .b8 kYCbCrFullRangeOffset[12] = {0, 0, 0, 0, 0, 0, 0, 67, 0, 0, 0, 67};
// Scalar f32 constants, written as raw IEEE-754 bit patterns (0f........).
// NOTE(review): the PQ_* / HLG_* / Gamma1886 names suggest transfer-function
// parameters -- confirm against the original source; none are read by the
// kernel visible in this file.
.const .align 4 .f32 PQ_m1 = 0f3E232000;
.const .align 4 .f32 PQ_m1Inv = 0f40C8E06B;
.const .align 4 .f32 PQ_m2 = 0f429DB000;
.const .align 4 .f32 PQ_m2Inv = 0f3C4FCDAC;
.const .align 4 .f32 PQ_c1 = 0f3F560000;
.const .align 4 .f32 PQ_c2 = 0f4196D000;
.const .align 4 .f32 PQ_c3 = 0f41958000;
.const .align 4 .f32 Gamma1886 = 0f4019999A;
.const .align 4 .f32 PQ_Lpeak = 0f461C4000;
.const .align 4 .f32 PQ_a = 0f3F8CAC08;
.const .align 4 .f32 PQ_b = 0f426E1556;
.const .align 4 .f32 PQ_c = 0f39B033E5;
.const .align 4 .f32 PQ_s = 0f4385EB85;
.const .align 4 .f32 PQ_g = 0f3EE66666;
.const .align 4 .f32 scaleFD = 0f42C80000;
.const .align 4 .f32 HLG_a = 0f3E371FF0;
.const .align 4 .f32 HLG_b = 0f3E91C020;
.const .align 4 .f32 HLG_c = 0f3F0F564F;
.const .align 4 .f32 HLG_inva = 0f40B2F029;
.const .align 4 .f32 HLG_alpha = 0f41200000;
.const .align 4 .f32 HLG_invAlpha = 0f3DCCCCCD;
.const .align 4 .f32 HLG_gamma = 0f3F99999A;
.const .align 4 .f32 HLG_gammaM1 = 0f3E4CCCCD;
.const .align 4 .f32 HLG_gammaM1Dgamma = 0f3E2AAAAB;
.const .align 4 .f32 HLG_YR = 0f3E86809D;
.const .align 4 .f32 HLG_YG = 0f3F2D9168;
.const .align 4 .f32 HLG_YB = 0f3D72E48F;
.const .align 4 .f32 HLG_Lpeak = 0f447A0000;
.const .align 4 .u32 kRandMax = 32767;
// Texture references; not used by GradientWipeKernel in the PTX visible here.
.global .texref inBilinearSrc;
.global .texref inPointSrc;

// GradientWipeKernel -- one thread per output pixel (x, y), where
//   x = ctaid.x * ntid.x + tid.x   and   y = ctaid.y * ntid.y + tid.y.
//
// What the code below does, in order:
//   1. Threads with x >= param_5[+0] or y >= param_5[+4] (unsigned) return.
//   2. A 4-component pixel is read from the buffer param_0 at
//      (x + param_6[+0], y + param_6[+4]); it is all zeros when that position
//      is negative or >= param_3[+0] / param_3[+4].
//   3. If param_10 != 0, a coordinate into the buffer param_1 is derived from
//      (x, y) according to param_11, a 4-component sample is fetched there
//      (4-tap weighted when param_9 != 0, truncating single fetch otherwise),
//      reduced to one scalar, mapped through the thresholds param_8[+0] and
//      param_8[+4] to a factor in [0, 1], and that factor interpolates between
//      param_8[+8] and param_8[+12]. The result multiplies the 4th component
//      of the pixel from step 2.
//   4. The pixel is written to the buffer param_2 at (x, y).
//
// Parameters (as used by the code):
//   param_0      u64  address of the buffer read in step 2
//   param_1      u64  address of the buffer sampled in step 3
//   param_2      u64  address of the buffer written in step 4
//   param_3[16]  s32 at +0/+4: bounds for param_0; +8: row pitch in pixels
//   param_4[16]  s32 at +0/+4: bounds for param_1; +8: row pitch in pixels
//   param_5[16]  u32 at +0/+4: bounds for param_2; +8: row pitch in pixels
//   param_6[8]   s32 x/y offset added to the thread position for step 2
//   param_7      != 0: pixels are four f32 (16 bytes); == 0: four f16 (8 bytes)
//   param_8[16]  f32 at +0/+4: thresholds; +8/+12: interpolation endpoints
//   param_9      != 0: 4-tap weighted sample; == 0: single truncated fetch
//   param_10     == 0: skip step 3 entirely
//   param_11     coordinate mode: 1, 2, 3 handled; any other value maps to (0,0)
//
// NOTE(review): bytes +12 of param_3/4/5 are never read here.
// NOTE(review): pixel indices are computed in 32 bits and then sign-extended;
// very large buffers could overflow the 32-bit multiply-add -- confirm limits
// with the host code.
.visible .entry GradientWipeKernel(
	.param .u64 GradientWipeKernel_param_0,
	.param .u64 GradientWipeKernel_param_1,
	.param .u64 GradientWipeKernel_param_2,
	.param .align 16 .b8 GradientWipeKernel_param_3[16],
	.param .align 16 .b8 GradientWipeKernel_param_4[16],
	.param .align 16 .b8 GradientWipeKernel_param_5[16],
	.param .align 8 .b8 GradientWipeKernel_param_6[8],
	.param .u32 GradientWipeKernel_param_7,
	.param .align 16 .b8 GradientWipeKernel_param_8[16],
	.param .u32 GradientWipeKernel_param_9,
	.param .u32 GradientWipeKernel_param_10,
	.param .u32 GradientWipeKernel_param_11
)
{
	.reg .pred 	%p<57>;
	.reg .b16 	%rs<29>;
	.reg .f32 	%f<364>;
	.reg .b32 	%r<50>;
	.reg .b64 	%rd<30>;


	// ---- Load all kernel parameters into registers ----
	ld.param.u64 	%rd11, [GradientWipeKernel_param_0];
	ld.param.u64 	%rd12, [GradientWipeKernel_param_1];
	ld.param.u64 	%rd13, [GradientWipeKernel_param_2];
	ld.param.u32 	%r24, [GradientWipeKernel_param_7];
	ld.param.u32 	%r25, [GradientWipeKernel_param_9];
	ld.param.u32 	%r26, [GradientWipeKernel_param_10];
	ld.param.u32 	%r27, [GradientWipeKernel_param_11];
	// param_8: %f153/%f154 = thresholds, %f155/%f156 = interpolation endpoints.
	ld.param.f32 	%f156, [GradientWipeKernel_param_8+12];
	ld.param.f32 	%f155, [GradientWipeKernel_param_8+8];
	ld.param.f32 	%f154, [GradientWipeKernel_param_8+4];
	ld.param.f32 	%f153, [GradientWipeKernel_param_8];
	// param_5: %r20/%r21 = output bounds, %r22 = output row pitch.
	ld.param.u32 	%r22, [GradientWipeKernel_param_5+8];
	ld.param.u32 	%r21, [GradientWipeKernel_param_5+4];
	ld.param.u32 	%r20, [GradientWipeKernel_param_5];
	// param_4: %r16/%r17 = bounds of the sampled buffer, %r18 = its row pitch.
	ld.param.u32 	%r18, [GradientWipeKernel_param_4+8];
	ld.param.u32 	%r17, [GradientWipeKernel_param_4+4];
	ld.param.u32 	%r16, [GradientWipeKernel_param_4];
	// param_3: %r12/%r13 = bounds of the first buffer, %r14 = its row pitch.
	ld.param.u32 	%r14, [GradientWipeKernel_param_3+8];
	ld.param.u32 	%r13, [GradientWipeKernel_param_3+4];
	ld.param.u32 	%r12, [GradientWipeKernel_param_3];
	// param_6: %r29 = x offset, %r28 = y offset.
	ld.param.u32 	%r28, [GradientWipeKernel_param_6+4];
	ld.param.u32 	%r29, [GradientWipeKernel_param_6];
	// Convert the three generic addresses to global-space addresses:
	// %rd1 = param_2 (written), %rd2 = param_1 (sampled), %rd3 = param_0 (read).
	cvta.to.global.u64 	%rd1, %rd13;
	cvta.to.global.u64 	%rd2, %rd12;
	cvta.to.global.u64 	%rd3, %rd11;
	// %r1 = x, %r2 = y: this thread's position in the launch grid.
	mov.u32 	%r30, %ntid.x;
	mov.u32 	%r31, %ctaid.x;
	mov.u32 	%r32, %tid.x;
	mad.lo.s32 	%r1, %r31, %r30, %r32;
	mov.u32 	%r33, %ntid.y;
	mov.u32 	%r34, %ctaid.y;
	mov.u32 	%r35, %tid.y;
	mad.lo.s32 	%r2, %r34, %r33, %r35;
	// %r3/%r4 = position used to read the first buffer (thread position + offset).
	add.s32 	%r3, %r29, %r1;
	add.s32 	%r4, %r28, %r2;
	// Threads outside the output bounds do nothing.
	setp.ge.u32 	%p5, %r1, %r20;
	setp.ge.u32 	%p6, %r2, %r21;
	or.pred  	%p7, %p5, %p6;
	@%p7 bra 	$L__BB0_49;

	// ---- Step 2: read the pixel from the first buffer ----
	// The pixel defaults to zero when %r3/%r4 fall outside [0, %r12) x [0, %r13).
	// (%r3 | %r4) < 0 is true when either coordinate has its sign bit set.
	setp.ge.s32 	%p8, %r3, %r12;
	or.b32  	%r36, %r3, %r4;
	setp.lt.s32 	%p9, %r36, 0;
	or.pred  	%p10, %p8, %p9;
	setp.ge.s32 	%p11, %r4, %r13;
	mov.f32 	%f320, 0f00000000;
	or.pred  	%p12, %p11, %p10;
	mov.f32 	%f321, %f320;
	mov.f32 	%f322, %f320;
	mov.f32 	%f323, %f320;
	@%p12 bra 	$L__BB0_5;

	// Pixel index = row * pitch + column.
	mad.lo.s32 	%r37, %r4, %r14, %r3;
	cvt.s64.s32 	%rd4, %r37;
	setp.eq.s32 	%p13, %r24, 0;
	@%p13 bra 	$L__BB0_4;

	// param_7 != 0: 16 bytes per pixel, four f32.
	// Components 0..3 land in %f323, %f322, %f321, %f320.
	shl.b64 	%rd14, %rd4, 4;
	add.s64 	%rd15, %rd3, %rd14;
	ld.global.v4.f32 	{%f323, %f322, %f321, %f320}, [%rd15];
	bra.uni 	$L__BB0_5;

$L__BB0_4:
	// param_7 == 0: 8 bytes per pixel, four f16 values widened to f32.
	shl.b64 	%rd16, %rd4, 3;
	add.s64 	%rd17, %rd3, %rd16;
	ld.global.u16 	%rs1, [%rd17];
	ld.global.u16 	%rs2, [%rd17+2];
	ld.global.u16 	%rs3, [%rd17+4];
	ld.global.u16 	%rs4, [%rd17+6];
	// begin inline asm
	{  cvt.f32.f16 %f323, %rs1;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f322, %rs2;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f321, %rs3;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f320, %rs4;}

	// end inline asm

$L__BB0_5:
	// ---- Step 3: optional modulation by the sampled buffer ----
	// param_10 == 0 skips straight to the store.
	setp.eq.s32 	%p14, %r26, 0;
	@%p14 bra 	$L__BB0_46;

	// Derive the sampling coordinate (%f324, %f325) from (x, y) by param_11.
	// Any value other than 1, 2 or 3 leaves the coordinate at (0, 0).
	mov.f32 	%f324, 0f00000000;
	setp.eq.s32 	%p15, %r27, 1;
	@%p15 bra 	$L__BB0_11;

	setp.eq.s32 	%p16, %r27, 2;
	@%p16 bra 	$L__BB0_10;

	setp.ne.s32 	%p17, %r27, 3;
	mov.f32 	%f325, %f324;
	@%p17 bra 	$L__BB0_12;

	// param_11 == 3: scale. coord = (sampled_size / output_size) * position.
	cvt.rn.f32.u32 	%f171, %r1;
	cvt.rn.f32.u32 	%f172, %r20;
	cvt.rn.f32.u32 	%f173, %r16;
	div.approx.ftz.f32 	%f174, %f173, %f172;
	mul.ftz.f32 	%f324, %f174, %f171;
	cvt.rn.f32.u32 	%f175, %r2;
	cvt.rn.f32.u32 	%f176, %r17;
	cvt.rn.f32.u32 	%f177, %r21;
	div.approx.ftz.f32 	%f178, %f176, %f177;
	mul.ftz.f32 	%f325, %f178, %f175;
	bra.uni 	$L__BB0_12;

$L__BB0_11:
	// param_11 == 1: wrap. coord = position modulo sampled_size (unsigned).
	// NOTE(review): the divisors come straight from param_4; nothing in this
	// kernel guards against them being zero -- confirm the host guarantees it.
	rem.u32 	%r40, %r1, %r16;
	cvt.rn.f32.u32 	%f324, %r40;
	rem.u32 	%r41, %r2, %r17;
	cvt.rn.f32.u32 	%f325, %r41;
	bra.uni 	$L__BB0_12;

$L__BB0_10:
	// param_11 == 2: offset. coord = position + (sampled_size - output_size) / 2.
	// 0f40000000 is 2.0f.
	cvt.rn.f32.u32 	%f179, %r1;
	sub.s32 	%r38, %r16, %r20;
	cvt.rn.f32.s32 	%f180, %r38;
	mov.f32 	%f181, 0f40000000;
	div.approx.ftz.f32 	%f182, %f180, %f181;
	add.ftz.f32 	%f324, %f182, %f179;
	sub.s32 	%r39, %r17, %r21;
	cvt.rn.f32.s32 	%f183, %r39;
	div.approx.ftz.f32 	%f184, %f183, %f181;
	cvt.rn.f32.u32 	%f185, %r2;
	add.ftz.f32 	%f325, %f184, %f185;

$L__BB0_12:
	// If the coordinate is outside [0, %r16) x [0, %r17) the sample is all zeros.
	// The comparisons are the unordered forms (geu/ltu), so a NaN coordinate
	// also takes the zero-sample path.
	// %f362 (the threshold factor computed further down) starts at 0.
	cvt.rn.f32.s32 	%f190, %r16;
	setp.geu.ftz.f32 	%p18, %f324, %f190;
	setp.ltu.ftz.f32 	%p19, %f324, 0f00000000;
	mov.f32 	%f362, 0f00000000;
	or.pred  	%p20, %p19, %p18;
	setp.ltu.ftz.f32 	%p21, %f325, 0f00000000;
	or.pred  	%p22, %p20, %p21;
	cvt.rn.f32.s32 	%f191, %r17;
	setp.geu.ftz.f32 	%p23, %f325, %f191;
	or.pred  	%p24, %p23, %p22;
	// Sample components 0..3 are carried in %f361, %f360, %f359, %f358.
	mov.f32 	%f358, %f362;
	mov.f32 	%f359, %f362;
	mov.f32 	%f360, %f362;
	mov.f32 	%f361, %f362;
	@%p24 bra 	$L__BB0_42;

	// param_9 == 0 selects the single-fetch path at $L__BB0_39.
	setp.eq.s32 	%p25, %r25, 0;
	@%p25 bra 	$L__BB0_39;

	// ---- 4-tap weighted sample ----
	// %r10/%r42 = floor of the coordinate; %f21/%f22 = fractional parts.
	cvt.rmi.ftz.f32.f32 	%f196, %f324;
	cvt.rzi.ftz.s32.f32 	%r10, %f196;
	cvt.rmi.ftz.f32.f32 	%f197, %f325;
	cvt.rzi.ftz.s32.f32 	%r42, %f197;
	cvt.rn.f32.s32 	%f198, %r10;
	sub.ftz.f32 	%f21, %f324, %f198;
	cvt.rn.f32.s32 	%f199, %r42;
	sub.ftz.f32 	%f22, %f325, %f199;
	// %r43/%r11 = the neighbouring column / row (+1).
	add.s32 	%r43, %r10, 1;
	add.s32 	%r11, %r42, 1;
	// Per-axis validity: %p1 = column in range, %p2 = column+1 in range,
	//                    %p3 = row in range,    %p4 = row+1 in range.
	setp.gt.s32 	%p26, %r10, -1;
	setp.lt.s32 	%p27, %r10, %r16;
	and.pred  	%p1, %p26, %p27;
	setp.gt.s32 	%p28, %r10, -2;
	setp.lt.s32 	%p29, %r43, %r16;
	and.pred  	%p2, %p28, %p29;
	setp.gt.s32 	%p30, %r42, -1;
	setp.lt.s32 	%p31, %r42, %r17;
	and.pred  	%p3, %p30, %p31;
	setp.gt.s32 	%p32, %r42, -2;
	setp.lt.s32 	%p33, %r11, %r17;
	and.pred  	%p4, %p32, %p33;
	and.pred  	%p34, %p1, %p3;
	// Addresses of the (column, row) tap for both pixel sizes:
	// %rd5 for 16-byte pixels, %rd6 for 8-byte pixels. Only computed here;
	// the loads below are guarded by the validity predicates.
	mad.lo.s32 	%r44, %r42, %r18, %r10;
	mul.wide.s32 	%rd18, %r44, 16;
	add.s64 	%rd5, %rd2, %rd18;
	mul.wide.s32 	%rd19, %r44, 8;
	add.s64 	%rd6, %rd2, %rd19;
	// Tap (column, row) -> %f39, %f40, %f41, %f333; zero when out of range.
	// %f59 is zeroed here as well and reused as the zero source further down.
	mov.f32 	%f59, 0f00000000;
	not.pred 	%p35, %p34;
	mov.f32 	%f39, %f59;
	mov.f32 	%f40, %f59;
	mov.f32 	%f41, %f59;
	mov.f32 	%f333, %f59;
	@%p35 bra 	$L__BB0_19;

	setp.eq.s32 	%p36, %r24, 0;
	@%p36 bra 	$L__BB0_17;

	ld.global.v4.f32 	{%f39, %f40, %f41, %f333}, [%rd5];
	bra.uni 	$L__BB0_19;

$L__BB0_39:
	// ---- Single-fetch sample: truncate the coordinate toward zero ----
	cvt.rzi.ftz.s32.f32 	%r46, %f324;
	cvt.rzi.ftz.s32.f32 	%r47, %f325;
	mad.lo.s32 	%r48, %r47, %r18, %r46;
	cvt.s64.s32 	%rd9, %r48;
	setp.eq.s32 	%p53, %r24, 0;
	@%p53 bra 	$L__BB0_41;

	// Four f32 per pixel.
	shl.b64 	%rd22, %rd9, 4;
	add.s64 	%rd23, %rd2, %rd22;
	ld.global.v4.f32 	{%f361, %f360, %f359, %f358}, [%rd23];
	bra.uni 	$L__BB0_42;

$L__BB0_41:
	// Four f16 per pixel, widened to f32.
	shl.b64 	%rd24, %rd9, 3;
	add.s64 	%rd25, %rd2, %rd24;
	ld.global.u16 	%rs21, [%rd25];
	ld.global.u16 	%rs22, [%rd25+2];
	ld.global.u16 	%rs23, [%rd25+4];
	ld.global.u16 	%rs24, [%rd25+6];
	// begin inline asm
	{  cvt.f32.f16 %f361, %rs21;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f360, %rs22;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f359, %rs23;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f358, %rs24;}

	// end inline asm
	bra.uni 	$L__BB0_42;

$L__BB0_17:
	// Tap (column, row), f16 pixel format.
	ld.global.u16 	%rs5, [%rd6];
	ld.global.u16 	%rs6, [%rd6+2];
	ld.global.u16 	%rs7, [%rd6+4];
	ld.global.u16 	%rs8, [%rd6+6];
	// begin inline asm
	{  cvt.f32.f16 %f39, %rs5;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f40, %rs6;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f41, %rs7;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f333, %rs8;}

	// end inline asm

$L__BB0_19:
	// Tap (column+1, row) -> %f59, %f60, %f61, %f341; zero when out of range.
	// It is the pixel immediately after the first tap in memory (+16 / +8 bytes).
	and.pred  	%p37, %p2, %p3;
	not.pred 	%p38, %p37;
	mov.f32 	%f60, %f59;
	mov.f32 	%f61, %f59;
	mov.f32 	%f341, %f59;
	@%p38 bra 	$L__BB0_24;

	setp.eq.s32 	%p39, %r24, 0;
	@%p39 bra 	$L__BB0_22;

	ld.global.v4.f32 	{%f59, %f60, %f61, %f341}, [%rd5+16];
	bra.uni 	$L__BB0_24;

$L__BB0_22:
	ld.global.u16 	%rs9, [%rd6+8];
	ld.global.u16 	%rs10, [%rd6+10];
	ld.global.u16 	%rs11, [%rd6+12];
	ld.global.u16 	%rs12, [%rd6+14];
	// begin inline asm
	{  cvt.f32.f16 %f59, %rs9;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f60, %rs10;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f61, %rs11;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f341, %rs12;}

	// end inline asm

$L__BB0_24:
	// Tap (column, row+1) -> %f79, %f80, %f81, %f349; zero when out of range.
	// %rd7 / %rd8 are its addresses for 16-byte / 8-byte pixels.
	mad.lo.s32 	%r45, %r11, %r18, %r10;
	mul.wide.s32 	%rd20, %r45, 16;
	add.s64 	%rd7, %rd2, %rd20;
	mul.wide.s32 	%rd21, %r45, 8;
	add.s64 	%rd8, %rd2, %rd21;
	and.pred  	%p40, %p1, %p4;
	mov.f32 	%f99, 0f00000000;
	not.pred 	%p41, %p40;
	mov.f32 	%f79, %f99;
	mov.f32 	%f80, %f99;
	mov.f32 	%f81, %f99;
	mov.f32 	%f349, %f99;
	@%p41 bra 	$L__BB0_29;

	setp.eq.s32 	%p42, %r24, 0;
	@%p42 bra 	$L__BB0_27;

	ld.global.v4.f32 	{%f79, %f80, %f81, %f349}, [%rd7];
	bra.uni 	$L__BB0_29;

$L__BB0_27:
	ld.global.u16 	%rs13, [%rd8];
	ld.global.u16 	%rs14, [%rd8+2];
	ld.global.u16 	%rs15, [%rd8+4];
	ld.global.u16 	%rs16, [%rd8+6];
	// begin inline asm
	{  cvt.f32.f16 %f79, %rs13;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f80, %rs14;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f81, %rs15;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f349, %rs16;}

	// end inline asm

$L__BB0_29:
	// Tap (column+1, row+1) -> %f99, %f100, %f101, %f357; zero when out of range.
	and.pred  	%p43, %p2, %p4;
	not.pred 	%p44, %p43;
	mov.f32 	%f100, %f99;
	mov.f32 	%f101, %f99;
	mov.f32 	%f357, %f99;
	@%p44 bra 	$L__BB0_34;

	setp.eq.s32 	%p45, %r24, 0;
	@%p45 bra 	$L__BB0_32;

	ld.global.v4.f32 	{%f99, %f100, %f101, %f357}, [%rd7+16];
	bra.uni 	$L__BB0_34;

$L__BB0_32:
	ld.global.u16 	%rs17, [%rd8+8];
	ld.global.u16 	%rs18, [%rd8+10];
	ld.global.u16 	%rs19, [%rd8+12];
	ld.global.u16 	%rs20, [%rd8+14];
	// begin inline asm
	{  cvt.f32.f16 %f99, %rs17;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f100, %rs18;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f101, %rs19;}

	// end inline asm
	// begin inline asm
	{  cvt.f32.f16 %f357, %rs20;}

	// end inline asm

$L__BB0_34:
	// Tap weights from the fractional parts fx = %f21, fy = %f22:
	//   %f103 = fx*fy              weight of tap (column+1, row+1)
	//   %f104 = fx - fx*fy         weight of tap (column+1, row)
	//   %f105 = fy - fx*fy         weight of tap (column,   row+1)
	//   %f106 = 1 - %f104 - %f105 - %f103   weight of tap (column, row)
	// 0f3F800000 is 1.0f.
	mul.ftz.f32 	%f103, %f21, %f22;
	sub.ftz.f32 	%f104, %f21, %f103;
	sub.ftz.f32 	%f105, %f22, %f103;
	mov.f32 	%f244, 0f3F800000;
	sub.ftz.f32 	%f245, %f244, %f104;
	sub.ftz.f32 	%f246, %f245, %f105;
	sub.ftz.f32 	%f106, %f246, %f103;
	// If the 4th component is identical across all four taps, take the plain
	// weighted sum ($L__BB0_38); otherwise go to $L__BB0_35.
	setp.eq.ftz.f32 	%p46, %f333, %f341;
	setp.eq.ftz.f32 	%p47, %f333, %f349;
	and.pred  	%p48, %p46, %p47;
	setp.eq.ftz.f32 	%p49, %f333, %f357;
	and.pred  	%p50, %p48, %p49;
	@%p50 bra 	$L__BB0_38;
	bra.uni 	$L__BB0_35;

$L__BB0_38:
	// Equal 4th components: components 0..2 are the weighted sums of the taps,
	// and the 4th component is passed through unchanged.
	mul.ftz.f32 	%f284, %f104, %f59;
	fma.rn.ftz.f32 	%f285, %f106, %f39, %f284;
	mul.ftz.f32 	%f286, %f104, %f60;
	fma.rn.ftz.f32 	%f287, %f106, %f40, %f286;
	mul.ftz.f32 	%f288, %f104, %f61;
	fma.rn.ftz.f32 	%f289, %f106, %f41, %f288;
	fma.rn.ftz.f32 	%f290, %f105, %f79, %f285;
	fma.rn.ftz.f32 	%f291, %f105, %f80, %f287;
	fma.rn.ftz.f32 	%f292, %f105, %f81, %f289;
	fma.rn.ftz.f32 	%f361, %f103, %f99, %f290;
	fma.rn.ftz.f32 	%f360, %f103, %f100, %f291;
	fma.rn.ftz.f32 	%f359, %f103, %f101, %f292;
	mov.f32 	%f358, %f333;
	bra.uni 	$L__BB0_42;

$L__BB0_35:
	// Differing 4th components: %f123 = weighted sum of the 4th components.
	mul.ftz.f32 	%f247, %f104, %f341;
	fma.rn.ftz.f32 	%f248, %f106, %f333, %f247;
	fma.rn.ftz.f32 	%f249, %f105, %f349, %f248;
	fma.rn.ftz.f32 	%f123, %f103, %f357, %f249;
	// A zero sum avoids the division below and uses the plain weighted sum.
	setp.eq.ftz.f32 	%p51, %f123, 0f00000000;
	@%p51 bra 	$L__BB0_37;
	bra.uni 	$L__BB0_36;

$L__BB0_37:
	// Weighted 4th component is zero: plain weighted sums, 4th component = 0.
	mul.ftz.f32 	%f275, %f104, %f59;
	fma.rn.ftz.f32 	%f276, %f106, %f39, %f275;
	mul.ftz.f32 	%f277, %f104, %f60;
	fma.rn.ftz.f32 	%f278, %f106, %f40, %f277;
	mul.ftz.f32 	%f279, %f104, %f61;
	fma.rn.ftz.f32 	%f280, %f106, %f41, %f279;
	fma.rn.ftz.f32 	%f281, %f105, %f79, %f276;
	fma.rn.ftz.f32 	%f282, %f105, %f80, %f278;
	fma.rn.ftz.f32 	%f283, %f105, %f81, %f280;
	fma.rn.ftz.f32 	%f361, %f103, %f99, %f281;
	fma.rn.ftz.f32 	%f360, %f103, %f100, %f282;
	fma.rn.ftz.f32 	%f359, %f103, %f101, %f283;
	mov.f32 	%f358, 0f00000000;
	bra.uni 	$L__BB0_42;

$L__BB0_36:
	// General case: the 4th component is the weighted sum limited to at most
	// 1.0; each of components 0..2 is the weighted sum of
	// (component * 4th component) over the taps, divided by that limited value.
	setp.gt.ftz.f32 	%p52, %f123, 0f3F800000;
	selp.f32 	%f358, 0f3F800000, %f123, %p52;
	// Component 2 -> %f359.
	mul.ftz.f32 	%f250, %f41, %f333;
	mul.ftz.f32 	%f251, %f61, %f341;
	mul.ftz.f32 	%f252, %f104, %f251;
	fma.rn.ftz.f32 	%f253, %f106, %f250, %f252;
	mul.ftz.f32 	%f254, %f81, %f349;
	fma.rn.ftz.f32 	%f255, %f105, %f254, %f253;
	mul.ftz.f32 	%f256, %f101, %f357;
	fma.rn.ftz.f32 	%f257, %f103, %f256, %f255;
	div.approx.ftz.f32 	%f359, %f257, %f358;
	// Component 1 -> %f360.
	mul.ftz.f32 	%f258, %f40, %f333;
	mul.ftz.f32 	%f259, %f60, %f341;
	mul.ftz.f32 	%f260, %f104, %f259;
	fma.rn.ftz.f32 	%f261, %f106, %f258, %f260;
	mul.ftz.f32 	%f262, %f80, %f349;
	fma.rn.ftz.f32 	%f263, %f105, %f262, %f261;
	mul.ftz.f32 	%f264, %f100, %f357;
	fma.rn.ftz.f32 	%f265, %f103, %f264, %f263;
	div.approx.ftz.f32 	%f360, %f265, %f358;
	// Component 0 -> %f361.
	mul.ftz.f32 	%f266, %f39, %f333;
	mul.ftz.f32 	%f267, %f59, %f341;
	mul.ftz.f32 	%f268, %f104, %f267;
	fma.rn.ftz.f32 	%f269, %f106, %f266, %f268;
	mul.ftz.f32 	%f270, %f79, %f349;
	fma.rn.ftz.f32 	%f271, %f105, %f270, %f269;
	mul.ftz.f32 	%f272, %f99, %f357;
	fma.rn.ftz.f32 	%f273, %f103, %f272, %f271;
	div.approx.ftz.f32 	%f361, %f273, %f358;

$L__BB0_42:
	// ---- Reduce the sample to one scalar and apply the thresholds ----
	// Weighted sum of sample components using the first three floats of
	// kRGB32f_To_601YPbPr: component 2 * [+0] + component 1 * [+4]
	// + component 0 * [+8], saturated to [0, 1], then multiplied by the 4th
	// component -> %f147.
	// NOTE(review): with weights of about 0.299/0.587/0.114 this presumably
	// computes luma from pixels stored in B,G,R,A order -- confirm.
	ld.const.f32 	%f302, [kRGB32f_To_601YPbPr];
	ld.const.f32 	%f303, [kRGB32f_To_601YPbPr+4];
	mul.ftz.f32 	%f304, %f360, %f303;
	fma.rn.ftz.f32 	%f305, %f359, %f302, %f304;
	ld.const.f32 	%f306, [kRGB32f_To_601YPbPr+8];
	fma.rn.ftz.f32 	%f307, %f361, %f306, %f305;
	cvt.ftz.sat.f32.f32 	%f308, %f307;
	mul.ftz.f32 	%f147, %f358, %f308;
	// 0f370637BD / 0fB70637BD are a small tolerance of about +/-8e-6.
	// If %f147 - tolerance <= low threshold, the factor %f362 stays 0.
	add.ftz.f32 	%f309, %f147, 0fB70637BD;
	setp.le.ftz.f32 	%p54, %f309, %f153;
	@%p54 bra 	$L__BB0_45;

	// If %f147 + tolerance >= high threshold, the factor is 1.
	add.ftz.f32 	%f311, %f147, 0f370637BD;
	setp.ge.ftz.f32 	%p55, %f311, %f154;
	mov.f32 	%f362, 0f3F800000;
	@%p55 bra 	$L__BB0_45;

	// Otherwise factor = (%f147 - low) / (high - low).
	sub.ftz.f32 	%f312, %f147, %f153;
	sub.ftz.f32 	%f313, %f154, %f153;
	div.approx.ftz.f32 	%f362, %f312, %f313;

$L__BB0_45:
	// Interpolate from param_8[+8] to param_8[+12] by the factor and scale the
	// 4th component of the pixel read in step 2. Components 0..2 are unchanged.
	sub.ftz.f32 	%f314, %f156, %f155;
	fma.rn.ftz.f32 	%f315, %f314, %f362, %f155;
	mul.ftz.f32 	%f320, %f320, %f315;

$L__BB0_46:
	// ---- Step 4: store the pixel at (x, y) in the output buffer ----
	// Pixel index = pitch * y + x.
	mad.lo.s32 	%r49, %r22, %r2, %r1;
	cvt.s64.s32 	%rd10, %r49;
	setp.eq.s32 	%p56, %r24, 0;
	@%p56 bra 	$L__BB0_48;

	// param_7 != 0: store four f32 (16 bytes per pixel).
	shl.b64 	%rd26, %rd10, 4;
	add.s64 	%rd27, %rd1, %rd26;
	st.global.v4.f32 	[%rd27], {%f323, %f322, %f321, %f320};
	bra.uni 	$L__BB0_49;

$L__BB0_48:
	// param_7 == 0: round each component to f16 (round-to-nearest) and store
	// four 16-bit values (8 bytes per pixel).
	// begin inline asm
	{  cvt.rn.f16.f32 %rs25, %f323;}

	// end inline asm
	// begin inline asm
	{  cvt.rn.f16.f32 %rs26, %f322;}

	// end inline asm
	// begin inline asm
	{  cvt.rn.f16.f32 %rs27, %f321;}

	// end inline asm
	// begin inline asm
	{  cvt.rn.f16.f32 %rs28, %f320;}

	// end inline asm
	shl.b64 	%rd28, %rd10, 3;
	add.s64 	%rd29, %rd1, %rd28;
	st.global.u16 	[%rd29], %rs25;
	st.global.u16 	[%rd29+2], %rs26;
	st.global.u16 	[%rd29+4], %rs27;
	st.global.u16 	[%rd29+6], %rs28;

$L__BB0_49:
	ret;

}

  ELF3         ~           @,       )      V2 @ 8  @    .shstrtab .strtab .symtab .symtab_shndx .nv.info .text.GradientWipeKernel .nv.info.GradientWipeKernel .nv.shared.GradientWipeKernel .nv.constant3 .nv.constant0.GradientWipeKernel .rel.nv.constant0.GradientWipeKernel .debug_frame .rel.debug_frame .rela.debug_frame .nv.callgraph .nv.prototype .nv.rel.action  .shstrtab .strtab .symtab .symtab_shndx .nv.info .text.GradientWipeKernel .nv.info.GradientWipeKernel .nv.shared.GradientWipeKernel .nv.constant3 kRGB32f_To_601YPbPr k601YPbPr_To_RGB32f kRGB32f_To_601YCbCr k601YCbCr_To_RGB32f kRGB8u_To_601YCbCr k601YCbCr_To_RGB8u kRGB8u_To_601YCbCrFullRange k601YCbCrFullRange_To_RGB8u kRGB32f_To_601YCbCrFullRange k601YCbCrFullRange_To_RGB32f kRGB32f_To_709YPbPr k709YPbPr_To_RGB32f kRGB32f_To_709YCbCr k709YCbCr_To_RGB32f k709YCbCrFullRange_To_RGB32f kRGB8u_To_709YCbCr k709YCbCr_To_RGB8u k709YCbCr_To_601YCbCr k601YCbCr_To_709YCbCr kZeroMatrix kYCbCrOffset kYCbCrFullRangeOffset PQ_m1 PQ_m1Inv PQ_m2 PQ_m2Inv PQ_c1 PQ_c2 PQ_c3 Gamma1886 PQ_Lpeak PQ_a PQ_b PQ_c PQ_s PQ_g scaleFD HLG_a HLG_b HLG_c HLG_inva HLG_alpha HLG_invAlpha HLG_gamma HLG_gammaM1 HLG_gammaM1Dgamma HLG_YR HLG_YG HLG_YB HLG_Lpeak kRandMax .rel.nv.constant0.GradientWipeKernel .nv.constant0.GradientWipeKernel .debug_frame .rel.debug_frame .rela.debug_frame .nv.callgraph .nv.prototype .nv.rel.action GradientWipeKernel inBilinearSrc inPointSrc                         2                         
                     
         $           
 $       $           
 H       $           
 l       $           
        $           
        $       	   
        $       %   
        $       A   
        $       ^   
 D      $       {   
 h      $          
       $          
       $          
       $          
       $          
       $          
 @      $          
 d      $       $   
       $       :   
       $       F   
              S   
              i   
              o   
              x   
              ~   
                 
                 
                 
                  
                 
                 
                 
                 
                 
                 
                 
                  
 $                
 (                
 ,                
 0                
 4                
 8                
 <             	   
 @                
 D             '   
 H             .   
 L             5   
 P             <   
 T             F   
 X             t                                                                                                                                           $        |( ((   4                                $   ( 8         / :   $    :        :       7 ~   5  
 6   `| |       x        
 t        	 p         `  A       X         P  !       @  A       0  A          A         !         !           !                                   s          % 6D          :   >E?x=!,o   ?   ?F^־膦  ?    t?  ?26  ??    FB C^A!0g  B  BoF%;    ;%;(ɺP%;<    y>?=>>NG
?    J?
?ȾP
?N@    >E?x=,'>>+վ;ߥ  ?    H?  ?6  ??    q}B\C\Ao+1H  B  BX9;    t;;26;;    гY>Y7?ݓ=Vž   ?   ?;  ?    ?  ??  ?M?    j<:BC|AO  B  BuQ$%;    ^;%;!9[%;R<    ;    ;;=?ﺃ;R;    :>5>?}=νY>>B̾$
?    x?
?5^Zl
?1@      ?d=MD>    g}?
    =b{?  ?z콳T    b?ؼ=    J==?                                      A   C   C       C   C  #>k@ BO<  V? ЖA A@ @F?VnB39Cff>  B7> >OV?)@   A=?L>*>>h-?r=  zD                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                              z  
       y      &   ( y       "   ( y      %   h y      !   b $z      z  i  p`  $z     / z  h  pdp   M	          z  l    z  F   
    z m    Ey        z  u  pR  x         r      x         r    pb  z   `  pfp  z  a  pfp   G	         z  n  pR  $z  b     x       
  X      X   
	  Y  $   Y    	     h             
    (     " 0    A   O 0     A    0
    A   0    A    Ay          G        $v  v     x     pR  G        x     pR  G         x     pR  x         G	        Ez	  i       Ez   h       Ez  d       s         " Ez  e       Er         Er         s	 	       b  r     A    r     A    r	     A  /  r     A   Gy        z  d   
    Er         z  h   
    Er          r  ?  r  ?  E|        E|        #x   ?    #x   ?     Gy  @      {   d      " z  e  pP  {
  e      p s          0 s
 
       b. x   s     !    x
 / s	     !   r         r   O $r     / $z d    $r   	
  'r      $z e    'r      'r 	      r     'r        $z d    r       z  d  p`  $z  e    z  e  p`  
 d   z  d  p`   e   z  d  pP  z  e  p`  
 d    d  3  * e    e  3  Er         Er         Ez  d       Ey  0      r     ` x
         Ez   e       x         r       r     ` r        $r       x      W  x      p   G	  p      z  t  pR  G  0
      s     q!  " x         Ey `      x         x         x
         s     q!  b z  d  pb x    x pB  z  d  pb  z  e  pb /x     x pBt  Er         $z f   x      pP   Er         !r       z  e  pb  x pBp  $z f   x pB  !r       x         %v Z    x      pPt   x         %v Z    G         z  n  pR        I     h          (     " 0    A   O 0	    A    0
    A   0    A    Ay         Ey        G         z  n  pR       )    h 
         (     " 0    A   O 0    A    0    A   0    A    Ay         x      pp   Ey        %v Z    x      ppp   x         x         $r      %v Z    G         z  n  pR             h          (     " 0    A   O 0    A    0    A   0    A    Ay         Ey        r         x         G         z  n  pR  !     	    h 
         (      " 0!    A   O 0    A    0    A   0     A    Ay         r       r     A   r      r       !r      !r       x       p  !t  ?    !r       !r       G	          r     A   #r       #r       #r       r       G         r     A   r     A   r     A    r

     A   r	     A   r     A   	x  ?     r     A   r	     A   r     A    r     A  s        "  r     A   #r

        r     A   #r   	   #r        r     A   r     A   #r
   
     r     A   #r      #r       #r	   
    #r      #r        r
	     A   r	     A   r     A   Gy         r     A   r     A   r     A   r         #r      #r	      #r
       #r      #r      #r       #r      #r	      #r
       Gy         r     A   r     A   r     A   #r      #r	      #r
       #r      #r      #r       #r      #r	      #r
       Gy         s     !   z  n  pR  s     !  $ $z f    x      * Z     Z   * [  $   [     )     h                (     " 0    A   O 0	    A    0
    A   0    A    Ay           z		    A  Ey         #z	
   	    #z  	    $v	 r     !r        !v		 s       r     A   !t7     z  p     G         !t 77     z   q   `  x    ?       q       ! p      ! p              $        A   Ay          #v 	 r        r      A   z  n  pR  $z j    x	       \      ]  	$        M          z \   >r        >r        z ]  	   x 2v        x2v       y      y      y     y     My          Gy    y            y            y            y            y            y            y            y            y            y            y            y            y            y                                                                                                  @       4                                                   t                                                                        :                                       H      p                              )      p                      $                             K      p@                                                 	    p                                                   %    p                                                      	   @                                                                           \                                   B               t                                  2                                    :  $                     @,                                                                                                @,                                           