Skip to content

Commit c49ec83

Browse files
committed
Add f16 inline asm support for LoongArch
1 parent 8da6239 commit c49ec83

File tree

3 files changed

+51
-4
lines changed

3 files changed

+51
-4
lines changed

compiler/rustc_codegen_llvm/src/asm.rs

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1021,6 +1021,15 @@ fn llvm_fixup_input<'ll, 'tcx>(
10211021
) if element.primitive() == Primitive::Float(Float::F16) => {
10221022
bx.bitcast(value, bx.type_vector(bx.type_i16(), count))
10231023
}
1024+
(LoongArch(LoongArchInlineAsmRegClass::freg), BackendRepr::Scalar(s))
1025+
if s.primitive() == Primitive::Float(Float::F16) =>
1026+
{
1027+
// Smaller floats are always "NaN-boxed" inside larger floats on LoongArch.
1028+
let value = bx.bitcast(value, bx.type_i16());
1029+
let value = bx.zext(value, bx.type_i32());
1030+
let value = bx.or(value, bx.const_u32(0xFFFF_0000));
1031+
bx.bitcast(value, bx.type_f32())
1032+
}
10241033
(Mips(MipsInlineAsmRegClass::reg), BackendRepr::Scalar(s)) => {
10251034
match s.primitive() {
10261035
// MIPS only supports register-length arithmetics.
@@ -1178,6 +1187,13 @@ fn llvm_fixup_output<'ll, 'tcx>(
11781187
) if element.primitive() == Primitive::Float(Float::F16) => {
11791188
bx.bitcast(value, bx.type_vector(bx.type_f16(), count))
11801189
}
1190+
(LoongArch(LoongArchInlineAsmRegClass::freg), BackendRepr::Scalar(s))
1191+
if s.primitive() == Primitive::Float(Float::F16) =>
1192+
{
1193+
let value = bx.bitcast(value, bx.type_i32());
1194+
let value = bx.trunc(value, bx.type_i16());
1195+
bx.bitcast(value, bx.type_f16())
1196+
}
11811197
(Mips(MipsInlineAsmRegClass::reg), BackendRepr::Scalar(s)) => {
11821198
match s.primitive() {
11831199
// MIPS only supports register-length arithmetics.
@@ -1318,6 +1334,11 @@ fn llvm_fixup_output_type<'ll, 'tcx>(
13181334
) if element.primitive() == Primitive::Float(Float::F16) => {
13191335
cx.type_vector(cx.type_i16(), count)
13201336
}
1337+
(LoongArch(LoongArchInlineAsmRegClass::freg), BackendRepr::Scalar(s))
1338+
if s.primitive() == Primitive::Float(Float::F16) =>
1339+
{
1340+
cx.type_f32()
1341+
}
13211342
(Mips(MipsInlineAsmRegClass::reg), BackendRepr::Scalar(s)) => {
13221343
match s.primitive() {
13231344
// MIPS only supports register-length arithmetics.

compiler/rustc_target/src/asm/loongarch.rs

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -37,9 +37,11 @@ impl LoongArchInlineAsmRegClass {
3737
arch: InlineAsmArch,
3838
) -> &'static [(InlineAsmType, Option<Symbol>)] {
3939
match (self, arch) {
40-
(Self::reg, InlineAsmArch::LoongArch64) => types! { _: I8, I16, I32, I64, F32, F64; },
41-
(Self::reg, InlineAsmArch::LoongArch32) => types! { _: I8, I16, I32, F32; },
42-
(Self::freg, _) => types! { f: F32; d: F64; },
40+
(Self::reg, InlineAsmArch::LoongArch64) => {
41+
types! { _: I8, I16, I32, I64, F16, F32, F64; }
42+
}
43+
(Self::reg, InlineAsmArch::LoongArch32) => types! { _: I8, I16, I32, F16, F32; },
44+
(Self::freg, _) => types! { f: F16, F32; d: F64; },
4345
_ => unreachable!("unsupported register class"),
4446
}
4547
}

tests/assembly/asm/loongarch-type.rs

Lines changed: 25 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
//@ compile-flags: -Zmerge-functions=disabled
55
//@ needs-llvm-components: loongarch
66

7-
#![feature(no_core)]
7+
#![feature(no_core, f16)]
88
#![crate_type = "rlib"]
99
#![no_core]
1010
#![allow(asm_sub_register, non_camel_case_types)]
@@ -69,6 +69,12 @@ check!(reg_i8, i8, reg, "move");
6969
// CHECK: #NO_APP
7070
check!(reg_i16, i16, reg, "move");
7171

72+
// CHECK-LABEL: reg_f16:
73+
// CHECK: #APP
74+
// CHECK: move ${{[a-z0-9]+}}, ${{[a-z0-9]+}}
75+
// CHECK: #NO_APP
76+
check!(reg_f16, f16, reg, "move");
77+
7278
// CHECK-LABEL: reg_i32:
7379
// CHECK: #APP
7480
// CHECK: move ${{[a-z0-9]+}}, ${{[a-z0-9]+}}
@@ -99,6 +105,12 @@ check!(reg_f64, f64, reg, "move");
99105
// CHECK: #NO_APP
100106
check!(reg_ptr, ptr, reg, "move");
101107

108+
// CHECK-LABEL: freg_f16:
109+
// CHECK: #APP
110+
// CHECK: fmov.s $f{{[a-z0-9]+}}, $f{{[a-z0-9]+}}
111+
// CHECK: #NO_APP
112+
check!(freg_f16, f16, freg, "fmov.s");
113+
102114
// CHECK-LABEL: freg_f32:
103115
// CHECK: #APP
104116
// CHECK: fmov.s $f{{[a-z0-9]+}}, $f{{[a-z0-9]+}}
@@ -123,6 +135,12 @@ check_reg!(r4_i8, i8, "$r4", "move");
123135
// CHECK: #NO_APP
124136
check_reg!(r4_i16, i16, "$r4", "move");
125137

138+
// CHECK-LABEL: r4_f16:
139+
// CHECK: #APP
140+
// CHECK: move $a0, $a0
141+
// CHECK: #NO_APP
142+
check_reg!(r4_f16, f16, "$r4", "move");
143+
126144
// CHECK-LABEL: r4_i32:
127145
// CHECK: #APP
128146
// CHECK: move $a0, $a0
@@ -153,6 +171,12 @@ check_reg!(r4_f64, f64, "$r4", "move");
153171
// CHECK: #NO_APP
154172
check_reg!(r4_ptr, ptr, "$r4", "move");
155173

174+
// CHECK-LABEL: f0_f16:
175+
// CHECK: #APP
176+
// CHECK: fmov.s $f{{[a-z0-9]+}}, $f{{[a-z0-9]+}}
177+
// CHECK: #NO_APP
178+
check_reg!(f0_f16, f16, "$f0", "fmov.s");
179+
156180
// CHECK-LABEL: f0_f32:
157181
// CHECK: #APP
158182
// CHECK: fmov.s $f{{[a-z0-9]+}}, $f{{[a-z0-9]+}}

0 commit comments

Comments
 (0)