/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */

#include "test_sve_acle.h"

/*
** cvt_f64_f16_m_tied1:
**	fcvt	z0\.d, p0/m, z4\.h
**	ret
*/
/* _m form, f16 -> f64: z0 is both the first argument and the result,
   z4 is the operand converted, so the expected body is a lone FCVT.  */
TEST_DUAL_Z (cvt_f64_f16_m_tied1, svfloat64_t, svfloat16_t,
	     z0 = svcvt_f64_f16_m (z0, p0, z4),
	     z0 = svcvt_f64_m (z0, p0, z4))

/*
** cvt_f64_f16_m_tied2:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0, z4
**	fcvt	z0\.d, p0/m, \1\.h
**	ret
*/
/* _m form, f16 -> f64, with z0 as the operand converted and z4 as the
   first argument: the expected body copies z0 aside before MOVPRFX
   overwrites it with z4, then converts from the copy.  */
TEST_DUAL_Z_REV (cvt_f64_f16_m_tied2, svfloat64_t, svfloat16_t,
		 z0_res = svcvt_f64_f16_m (z4, p0, z0),
		 z0_res = svcvt_f64_m (z4, p0, z0))

/*
** cvt_f64_f16_m_untied:
**	movprfx	z0, z1
**	fcvt	z0\.d, p0/m, z4\.h
**	ret
*/
/* _m form, f16 -> f64, with first argument z1 and converted operand z4,
   neither of which is the z0 result: expects MOVPRFX from z1, then FCVT.  */
TEST_DUAL_Z (cvt_f64_f16_m_untied, svfloat64_t, svfloat16_t,
	     z0 = svcvt_f64_f16_m (z1, p0, z4),
	     z0 = svcvt_f64_m (z1, p0, z4))

/*
** cvt_f64_f32_m_tied1:
**	fcvt	z0\.d, p0/m, z4\.s
**	ret
*/
/* _m form, f32 -> f64: z0 is both the first argument and the result,
   z4 is the operand converted, so the expected body is a lone FCVT.  */
TEST_DUAL_Z (cvt_f64_f32_m_tied1, svfloat64_t, svfloat32_t,
	     z0 = svcvt_f64_f32_m (z0, p0, z4),
	     z0 = svcvt_f64_m (z0, p0, z4))

/*
** cvt_f64_f32_m_tied2:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0, z4
**	fcvt	z0\.d, p0/m, \1\.s
**	ret
*/
/* _m form, f32 -> f64, with z0 as the operand converted and z4 as the
   first argument: the expected body copies z0 aside before MOVPRFX
   overwrites it with z4, then converts from the copy.  */
TEST_DUAL_Z_REV (cvt_f64_f32_m_tied2, svfloat64_t, svfloat32_t,
		 z0_res = svcvt_f64_f32_m (z4, p0, z0),
		 z0_res = svcvt_f64_m (z4, p0, z0))

/*
** cvt_f64_f32_m_untied:
**	movprfx	z0, z1
**	fcvt	z0\.d, p0/m, z4\.s
**	ret
*/
/* _m form, f32 -> f64, with first argument z1 and converted operand z4,
   neither of which is the z0 result: expects MOVPRFX from z1, then FCVT.  */
TEST_DUAL_Z (cvt_f64_f32_m_untied, svfloat64_t, svfloat32_t,
	     z0 = svcvt_f64_f32_m (z1, p0, z4),
	     z0 = svcvt_f64_m (z1, p0, z4))

/*
** cvt_f64_s32_m_tied1:
**	scvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _m form, s32 -> f64: z0 is both the first argument and the result,
   z4 is the operand converted, so the expected body is a lone SCVTF.  */
TEST_DUAL_Z (cvt_f64_s32_m_tied1, svfloat64_t, svint32_t,
	     z0 = svcvt_f64_s32_m (z0, p0, z4),
	     z0 = svcvt_f64_m (z0, p0, z4))

/*
** cvt_f64_s32_m_tied2:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0, z4
**	scvtf	z0\.d, p0/m, \1\.s
**	ret
*/
/* _m form, s32 -> f64, with z0 as the operand converted and z4 as the
   first argument: the expected body copies z0 aside before MOVPRFX
   overwrites it with z4, then converts from the copy.  */
TEST_DUAL_Z_REV (cvt_f64_s32_m_tied2, svfloat64_t, svint32_t,
		 z0_res = svcvt_f64_s32_m (z4, p0, z0),
		 z0_res = svcvt_f64_m (z4, p0, z0))

/*
** cvt_f64_s32_m_untied:
**	movprfx	z0, z1
**	scvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _m form, s32 -> f64, with first argument z1 and converted operand z4,
   neither of which is the z0 result: expects MOVPRFX from z1, then SCVTF.  */
TEST_DUAL_Z (cvt_f64_s32_m_untied, svfloat64_t, svint32_t,
	     z0 = svcvt_f64_s32_m (z1, p0, z4),
	     z0 = svcvt_f64_m (z1, p0, z4))

/*
** cvt_f64_s64_m_tied1:
**	scvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _m form, s64 -> f64: z0 is both the first argument and the result,
   z4 is the operand converted, so the expected body is a lone SCVTF.  */
TEST_DUAL_Z (cvt_f64_s64_m_tied1, svfloat64_t, svint64_t,
	     z0 = svcvt_f64_s64_m (z0, p0, z4),
	     z0 = svcvt_f64_m (z0, p0, z4))

/*
** cvt_f64_s64_m_tied2:
**	mov	(z[0-9]+\.d), z0\.d
**	movprfx	z0, z4
**	scvtf	z0\.d, p0/m, \1
**	ret
*/
/* _m form, s64 -> f64, with z0 as the operand converted and z4 as the
   first argument: the expected body copies z0 aside before MOVPRFX
   overwrites it with z4, then converts from the copy.  */
TEST_DUAL_Z_REV (cvt_f64_s64_m_tied2, svfloat64_t, svint64_t,
		 z0_res = svcvt_f64_s64_m (z4, p0, z0),
		 z0_res = svcvt_f64_m (z4, p0, z0))

/*
** cvt_f64_s64_m_untied:
**	movprfx	z0, z1
**	scvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _m form, s64 -> f64, with first argument z1 and converted operand z4,
   neither of which is the z0 result: expects MOVPRFX from z1, then SCVTF.  */
TEST_DUAL_Z (cvt_f64_s64_m_untied, svfloat64_t, svint64_t,
	     z0 = svcvt_f64_s64_m (z1, p0, z4),
	     z0 = svcvt_f64_m (z1, p0, z4))

/*
** cvt_f64_u32_m_tied1:
**	ucvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _m form, u32 -> f64: z0 is both the first argument and the result,
   z4 is the operand converted, so the expected body is a lone UCVTF.  */
TEST_DUAL_Z (cvt_f64_u32_m_tied1, svfloat64_t, svuint32_t,
	     z0 = svcvt_f64_u32_m (z0, p0, z4),
	     z0 = svcvt_f64_m (z0, p0, z4))

/*
** cvt_f64_u32_m_tied2:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0, z4
**	ucvtf	z0\.d, p0/m, \1\.s
**	ret
*/
/* _m form, u32 -> f64, with z0 as the operand converted and z4 as the
   first argument: the expected body copies z0 aside before MOVPRFX
   overwrites it with z4, then converts from the copy.  */
TEST_DUAL_Z_REV (cvt_f64_u32_m_tied2, svfloat64_t, svuint32_t,
		 z0_res = svcvt_f64_u32_m (z4, p0, z0),
		 z0_res = svcvt_f64_m (z4, p0, z0))

/*
** cvt_f64_u32_m_untied:
**	movprfx	z0, z1
**	ucvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _m form, u32 -> f64, with first argument z1 and converted operand z4,
   neither of which is the z0 result: expects MOVPRFX from z1, then UCVTF.  */
TEST_DUAL_Z (cvt_f64_u32_m_untied, svfloat64_t, svuint32_t,
	     z0 = svcvt_f64_u32_m (z1, p0, z4),
	     z0 = svcvt_f64_m (z1, p0, z4))

/*
** cvt_f64_u64_m_tied1:
**	ucvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _m form, u64 -> f64: z0 is both the first argument and the result,
   z4 is the operand converted, so the expected body is a lone UCVTF.  */
TEST_DUAL_Z (cvt_f64_u64_m_tied1, svfloat64_t, svuint64_t,
	     z0 = svcvt_f64_u64_m (z0, p0, z4),
	     z0 = svcvt_f64_m (z0, p0, z4))

/*
** cvt_f64_u64_m_tied2:
**	mov	(z[0-9]+\.d), z0\.d
**	movprfx	z0, z4
**	ucvtf	z0\.d, p0/m, \1
**	ret
*/
/* _m form, u64 -> f64, with z0 as the operand converted and z4 as the
   first argument: the expected body copies z0 aside before MOVPRFX
   overwrites it with z4, then converts from the copy.  */
TEST_DUAL_Z_REV (cvt_f64_u64_m_tied2, svfloat64_t, svuint64_t,
		 z0_res = svcvt_f64_u64_m (z4, p0, z0),
		 z0_res = svcvt_f64_m (z4, p0, z0))

/*
** cvt_f64_u64_m_untied:
**	movprfx	z0, z1
**	ucvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _m form, u64 -> f64, with first argument z1 and converted operand z4,
   neither of which is the z0 result: expects MOVPRFX from z1, then UCVTF.  */
TEST_DUAL_Z (cvt_f64_u64_m_untied, svfloat64_t, svuint64_t,
	     z0 = svcvt_f64_u64_m (z1, p0, z4),
	     z0 = svcvt_f64_m (z1, p0, z4))

/*
** cvt_f64_f16_z_tied1:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0\.d, p0/z, \1\.d
**	fcvt	z0\.d, p0/m, \1\.h
**	ret
*/
/* _z form, f16 -> f64, with the converted operand in z0: the expected
   body copies z0 to a scratch register, issues a p0/z MOVPRFX from that
   copy and then converts from it.  */
TEST_DUAL_Z_REV (cvt_f64_f16_z_tied1, svfloat64_t, svfloat16_t,
		 z0_res = svcvt_f64_f16_z (p0, z0),
		 z0_res = svcvt_f64_z (p0, z0))

/*
** cvt_f64_f16_z_untied:
**	movprfx	z0\.d, p0/z, z4\.d
**	fcvt	z0\.d, p0/m, z4\.h
**	ret
*/
/* _z form, f16 -> f64, with the converted operand in z4: the expected
   body is a p0/z MOVPRFX from z4 followed by FCVT.  */
TEST_DUAL_Z (cvt_f64_f16_z_untied, svfloat64_t, svfloat16_t,
	     z0 = svcvt_f64_f16_z (p0, z4),
	     z0 = svcvt_f64_z (p0, z4))

/*
** cvt_f64_f32_z_tied1:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0\.d, p0/z, \1\.d
**	fcvt	z0\.d, p0/m, \1\.s
**	ret
*/
/* _z form, f32 -> f64, with the converted operand in z0: the expected
   body copies z0 to a scratch register, issues a p0/z MOVPRFX from that
   copy and then converts from it.  */
TEST_DUAL_Z_REV (cvt_f64_f32_z_tied1, svfloat64_t, svfloat32_t,
		 z0_res = svcvt_f64_f32_z (p0, z0),
		 z0_res = svcvt_f64_z (p0, z0))

/*
** cvt_f64_f32_z_untied:
**	movprfx	z0\.d, p0/z, z4\.d
**	fcvt	z0\.d, p0/m, z4\.s
**	ret
*/
/* _z form, f32 -> f64, with the converted operand in z4: the expected
   body is a p0/z MOVPRFX from z4 followed by FCVT.  */
TEST_DUAL_Z (cvt_f64_f32_z_untied, svfloat64_t, svfloat32_t,
	     z0 = svcvt_f64_f32_z (p0, z4),
	     z0 = svcvt_f64_z (p0, z4))

/*
** cvt_f64_s32_z_tied1:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0\.d, p0/z, \1\.d
**	scvtf	z0\.d, p0/m, \1\.s
**	ret
*/
/* _z form, s32 -> f64, with the converted operand in z0: the expected
   body copies z0 to a scratch register, issues a p0/z MOVPRFX from that
   copy and then converts from it.  */
TEST_DUAL_Z_REV (cvt_f64_s32_z_tied1, svfloat64_t, svint32_t,
		 z0_res = svcvt_f64_s32_z (p0, z0),
		 z0_res = svcvt_f64_z (p0, z0))

/*
** cvt_f64_s32_z_untied:
**	movprfx	z0\.d, p0/z, z4\.d
**	scvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _z form, s32 -> f64, with the converted operand in z4: the expected
   body is a p0/z MOVPRFX from z4 followed by SCVTF.  */
TEST_DUAL_Z (cvt_f64_s32_z_untied, svfloat64_t, svint32_t,
	     z0 = svcvt_f64_s32_z (p0, z4),
	     z0 = svcvt_f64_z (p0, z4))

/*
** cvt_f64_s64_z_tied1:
**	mov	(z[0-9]+\.d), z0\.d
**	movprfx	z0\.d, p0/z, \1
**	scvtf	z0\.d, p0/m, \1
**	ret
*/
/* _z form, s64 -> f64, with the converted operand in z0: the expected
   body copies z0 to a scratch register, issues a p0/z MOVPRFX from that
   copy and then converts from it.  */
TEST_DUAL_Z_REV (cvt_f64_s64_z_tied1, svfloat64_t, svint64_t,
		 z0_res = svcvt_f64_s64_z (p0, z0),
		 z0_res = svcvt_f64_z (p0, z0))

/*
** cvt_f64_s64_z_untied:
**	movprfx	z0\.d, p0/z, z4\.d
**	scvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _z form, s64 -> f64, with the converted operand in z4: the expected
   body is a p0/z MOVPRFX from z4 followed by SCVTF.  */
TEST_DUAL_Z (cvt_f64_s64_z_untied, svfloat64_t, svint64_t,
	     z0 = svcvt_f64_s64_z (p0, z4),
	     z0 = svcvt_f64_z (p0, z4))

/*
** cvt_f64_u32_z_tied1:
**	mov	(z[0-9]+)\.d, z0\.d
**	movprfx	z0\.d, p0/z, \1\.d
**	ucvtf	z0\.d, p0/m, \1\.s
**	ret
*/
/* _z form, u32 -> f64, with the converted operand in z0: the expected
   body copies z0 to a scratch register, issues a p0/z MOVPRFX from that
   copy and then converts from it.  */
TEST_DUAL_Z_REV (cvt_f64_u32_z_tied1, svfloat64_t, svuint32_t,
		 z0_res = svcvt_f64_u32_z (p0, z0),
		 z0_res = svcvt_f64_z (p0, z0))

/*
** cvt_f64_u32_z_untied:
**	movprfx	z0\.d, p0/z, z4\.d
**	ucvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _z form, u32 -> f64, with the converted operand in z4: the expected
   body is a p0/z MOVPRFX from z4 followed by UCVTF.  */
TEST_DUAL_Z (cvt_f64_u32_z_untied, svfloat64_t, svuint32_t,
	     z0 = svcvt_f64_u32_z (p0, z4),
	     z0 = svcvt_f64_z (p0, z4))

/*
** cvt_f64_u64_z_tied1:
**	mov	(z[0-9]+\.d), z0\.d
**	movprfx	z0\.d, p0/z, \1
**	ucvtf	z0\.d, p0/m, \1
**	ret
*/
/* _z form, u64 -> f64, with the converted operand in z0: the expected
   body copies z0 to a scratch register, issues a p0/z MOVPRFX from that
   copy and then converts from it.  */
TEST_DUAL_Z_REV (cvt_f64_u64_z_tied1, svfloat64_t, svuint64_t,
		 z0_res = svcvt_f64_u64_z (p0, z0),
		 z0_res = svcvt_f64_z (p0, z0))

/*
** cvt_f64_u64_z_untied:
**	movprfx	z0\.d, p0/z, z4\.d
**	ucvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _z form, u64 -> f64, with the converted operand in z4: the expected
   body is a p0/z MOVPRFX from z4 followed by UCVTF.  */
TEST_DUAL_Z (cvt_f64_u64_z_untied, svfloat64_t, svuint64_t,
	     z0 = svcvt_f64_u64_z (p0, z4),
	     z0 = svcvt_f64_z (p0, z4))

/*
** cvt_f64_f16_x_tied1:
**	fcvt	z0\.d, p0/m, z0\.h
**	ret
*/
/* _x form, f16 -> f64, with the converted operand in z0: the expected
   body is a single FCVT that reads and writes z0.  */
TEST_DUAL_Z_REV (cvt_f64_f16_x_tied1, svfloat64_t, svfloat16_t,
		 z0_res = svcvt_f64_f16_x (p0, z0),
		 z0_res = svcvt_f64_x (p0, z0))

/*
** cvt_f64_f16_x_untied:
**	movprfx	z0, z4
**	fcvt	z0\.d, p0/m, z4\.h
**	ret
*/
/* _x form, f16 -> f64, with the converted operand in z4: the expected
   body is an unpredicated MOVPRFX from z4 followed by FCVT.  */
TEST_DUAL_Z (cvt_f64_f16_x_untied, svfloat64_t, svfloat16_t,
	     z0 = svcvt_f64_f16_x (p0, z4),
	     z0 = svcvt_f64_x (p0, z4))

/*
** cvt_f64_f32_x_tied1:
**	fcvt	z0\.d, p0/m, z0\.s
**	ret
*/
/* _x form, f32 -> f64, with the converted operand in z0: the expected
   body is a single FCVT that reads and writes z0.  */
TEST_DUAL_Z_REV (cvt_f64_f32_x_tied1, svfloat64_t, svfloat32_t,
		 z0_res = svcvt_f64_f32_x (p0, z0),
		 z0_res = svcvt_f64_x (p0, z0))

/*
** cvt_f64_f32_x_untied:
**	movprfx	z0, z4
**	fcvt	z0\.d, p0/m, z4\.s
**	ret
*/
/* _x form, f32 -> f64, with the converted operand in z4: the expected
   body is an unpredicated MOVPRFX from z4 followed by FCVT.  */
TEST_DUAL_Z (cvt_f64_f32_x_untied, svfloat64_t, svfloat32_t,
	     z0 = svcvt_f64_f32_x (p0, z4),
	     z0 = svcvt_f64_x (p0, z4))

/*
** cvt_f64_s32_x_tied1:
**	scvtf	z0\.d, p0/m, z0\.s
**	ret
*/
/* _x form, s32 -> f64, with the converted operand in z0: the expected
   body is a single SCVTF that reads and writes z0.  */
TEST_DUAL_Z_REV (cvt_f64_s32_x_tied1, svfloat64_t, svint32_t,
		 z0_res = svcvt_f64_s32_x (p0, z0),
		 z0_res = svcvt_f64_x (p0, z0))

/*
** cvt_f64_s32_x_untied:
**	movprfx	z0, z4
**	scvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _x form, s32 -> f64, with the converted operand in z4: the expected
   body is an unpredicated MOVPRFX from z4 followed by SCVTF.  */
TEST_DUAL_Z (cvt_f64_s32_x_untied, svfloat64_t, svint32_t,
	     z0 = svcvt_f64_s32_x (p0, z4),
	     z0 = svcvt_f64_x (p0, z4))

/*
** cvt_f64_s64_x_tied1:
**	scvtf	z0\.d, p0/m, z0\.d
**	ret
*/
/* _x form, s64 -> f64, with the converted operand in z0: the expected
   body is a single SCVTF that reads and writes z0.  */
TEST_DUAL_Z_REV (cvt_f64_s64_x_tied1, svfloat64_t, svint64_t,
		 z0_res = svcvt_f64_s64_x (p0, z0),
		 z0_res = svcvt_f64_x (p0, z0))

/*
** cvt_f64_s64_x_untied:
**	movprfx	z0, z4
**	scvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _x form, s64 -> f64, with the converted operand in z4: the expected
   body is an unpredicated MOVPRFX from z4 followed by SCVTF.  */
TEST_DUAL_Z (cvt_f64_s64_x_untied, svfloat64_t, svint64_t,
	     z0 = svcvt_f64_s64_x (p0, z4),
	     z0 = svcvt_f64_x (p0, z4))

/*
** cvt_f64_u32_x_tied1:
**	ucvtf	z0\.d, p0/m, z0\.s
**	ret
*/
/* _x form, u32 -> f64, with the converted operand in z0: the expected
   body is a single UCVTF that reads and writes z0.  */
TEST_DUAL_Z_REV (cvt_f64_u32_x_tied1, svfloat64_t, svuint32_t,
		 z0_res = svcvt_f64_u32_x (p0, z0),
		 z0_res = svcvt_f64_x (p0, z0))

/*
** cvt_f64_u32_x_untied:
**	movprfx	z0, z4
**	ucvtf	z0\.d, p0/m, z4\.s
**	ret
*/
/* _x form, u32 -> f64, with the converted operand in z4: the expected
   body is an unpredicated MOVPRFX from z4 followed by UCVTF.  */
TEST_DUAL_Z (cvt_f64_u32_x_untied, svfloat64_t, svuint32_t,
	     z0 = svcvt_f64_u32_x (p0, z4),
	     z0 = svcvt_f64_x (p0, z4))

/*
** cvt_f64_u64_x_tied1:
**	ucvtf	z0\.d, p0/m, z0\.d
**	ret
*/
/* _x form, u64 -> f64, with the converted operand in z0: the expected
   body is a single UCVTF that reads and writes z0.  */
TEST_DUAL_Z_REV (cvt_f64_u64_x_tied1, svfloat64_t, svuint64_t,
		 z0_res = svcvt_f64_u64_x (p0, z0),
		 z0_res = svcvt_f64_x (p0, z0))

/*
** cvt_f64_u64_x_untied:
**	movprfx	z0, z4
**	ucvtf	z0\.d, p0/m, z4\.d
**	ret
*/
/* _x form, u64 -> f64, with the converted operand in z4: the expected
   body is an unpredicated MOVPRFX from z4 followed by UCVTF.  */
TEST_DUAL_Z (cvt_f64_u64_x_untied, svfloat64_t, svuint64_t,
	     z0 = svcvt_f64_u64_x (p0, z4),
	     z0 = svcvt_f64_x (p0, z4))

/*
** ptrue_cvt_f64_f16_x_tied1:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, f16 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z0.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z_REV (ptrue_cvt_f64_f16_x_tied1, svfloat64_t, svfloat16_t,
		 z0_res = svcvt_f64_f16_x (svptrue_b64 (), z0),
		 z0_res = svcvt_f64_x (svptrue_b64 (), z0))

/*
** ptrue_cvt_f64_f16_x_untied:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, f16 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z4.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z (ptrue_cvt_f64_f16_x_untied, svfloat64_t, svfloat16_t,
	     z0 = svcvt_f64_f16_x (svptrue_b64 (), z4),
	     z0 = svcvt_f64_x (svptrue_b64 (), z4))

/*
** ptrue_cvt_f64_f32_x_tied1:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, f32 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z0.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z_REV (ptrue_cvt_f64_f32_x_tied1, svfloat64_t, svfloat32_t,
		 z0_res = svcvt_f64_f32_x (svptrue_b64 (), z0),
		 z0_res = svcvt_f64_x (svptrue_b64 (), z0))

/*
** ptrue_cvt_f64_f32_x_untied:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, f32 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z4.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z (ptrue_cvt_f64_f32_x_untied, svfloat64_t, svfloat32_t,
	     z0 = svcvt_f64_f32_x (svptrue_b64 (), z4),
	     z0 = svcvt_f64_x (svptrue_b64 (), z4))

/*
** ptrue_cvt_f64_s32_x_tied1:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, s32 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z0.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z_REV (ptrue_cvt_f64_s32_x_tied1, svfloat64_t, svint32_t,
		 z0_res = svcvt_f64_s32_x (svptrue_b64 (), z0),
		 z0_res = svcvt_f64_x (svptrue_b64 (), z0))

/*
** ptrue_cvt_f64_s32_x_untied:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, s32 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z4.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z (ptrue_cvt_f64_s32_x_untied, svfloat64_t, svint32_t,
	     z0 = svcvt_f64_s32_x (svptrue_b64 (), z4),
	     z0 = svcvt_f64_x (svptrue_b64 (), z4))

/*
** ptrue_cvt_f64_s64_x_tied1:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, s64 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z0.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z_REV (ptrue_cvt_f64_s64_x_tied1, svfloat64_t, svint64_t,
		 z0_res = svcvt_f64_s64_x (svptrue_b64 (), z0),
		 z0_res = svcvt_f64_x (svptrue_b64 (), z0))

/*
** ptrue_cvt_f64_s64_x_untied:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, s64 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z4.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z (ptrue_cvt_f64_s64_x_untied, svfloat64_t, svint64_t,
	     z0 = svcvt_f64_s64_x (svptrue_b64 (), z4),
	     z0 = svcvt_f64_x (svptrue_b64 (), z4))

/*
** ptrue_cvt_f64_u32_x_tied1:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, u32 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z0.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z_REV (ptrue_cvt_f64_u32_x_tied1, svfloat64_t, svuint32_t,
		 z0_res = svcvt_f64_u32_x (svptrue_b64 (), z0),
		 z0_res = svcvt_f64_x (svptrue_b64 (), z0))

/*
** ptrue_cvt_f64_u32_x_untied:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, u32 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z4.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z (ptrue_cvt_f64_u32_x_untied, svfloat64_t, svuint32_t,
	     z0 = svcvt_f64_u32_x (svptrue_b64 (), z4),
	     z0 = svcvt_f64_x (svptrue_b64 (), z4))

/*
** ptrue_cvt_f64_u64_x_tied1:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, u64 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z0.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z_REV (ptrue_cvt_f64_u64_x_tied1, svfloat64_t, svuint64_t,
		 z0_res = svcvt_f64_u64_x (svptrue_b64 (), z0),
		 z0_res = svcvt_f64_x (svptrue_b64 (), z0))

/*
** ptrue_cvt_f64_u64_x_untied:
**	...
**	ptrue	p[0-9]+\.b[^\n]*
**	...
**	ret
*/
/* _x form, u64 -> f64, governed by svptrue_b64 () rather than p0, with
   the operand in z4.  The expected body only requires a PTRUE on a .b
   predicate somewhere before RET.  */
TEST_DUAL_Z (ptrue_cvt_f64_u64_x_untied, svfloat64_t, svuint64_t,
	     z0 = svcvt_f64_u64_x (svptrue_b64 (), z4),
	     z0 = svcvt_f64_x (svptrue_b64 (), z4))
