mirror of
https://github.com/vosen/ZLUDA.git
synced 2025-07-18 17:56:22 +03:00
Implement negation
This commit is contained in:
@ -176,7 +176,7 @@ pub enum Instruction<P: ArgParams> {
|
|||||||
Add(AddDetails, Arg3<P>),
|
Add(AddDetails, Arg3<P>),
|
||||||
Setp(SetpData, Arg4<P>),
|
Setp(SetpData, Arg4<P>),
|
||||||
SetpBool(SetpBoolData, Arg5<P>),
|
SetpBool(SetpBoolData, Arg5<P>),
|
||||||
Not(NotData, Arg2<P>),
|
Not(NotType, Arg2<P>),
|
||||||
Bra(BraData, Arg1<P>),
|
Bra(BraData, Arg1<P>),
|
||||||
Cvt(CvtData, Arg2<P>),
|
Cvt(CvtData, Arg2<P>),
|
||||||
Shl(ShlData, Arg3<P>),
|
Shl(ShlData, Arg3<P>),
|
||||||
@ -386,7 +386,13 @@ pub struct SetpBoolData {
|
|||||||
pub bool_op: SetpBoolPostOp,
|
pub bool_op: SetpBoolPostOp,
|
||||||
}
|
}
|
||||||
|
|
||||||
pub struct NotData {}
|
/// Operand type accepted by the PTX `not` instruction.
///
/// Each variant corresponds to one type suffix recognised by the parser:
/// `.pred`, `.b16`, `.b32` and `.b64`.
#[derive(Debug, PartialEq, Eq, Copy, Clone)]
pub enum NotType {
    /// `.pred` — predicate operand; negation is emitted as a logical not.
    Pred,
    /// `.b16` — 16-bit untyped operand; negation is emitted as a bitwise not.
    B16,
    /// `.b32` — 32-bit untyped operand; negation is emitted as a bitwise not.
    B32,
    /// `.b64` — 64-bit untyped operand; negation is emitted as a bitwise not.
    B64,
}
|
||||||
|
|
||||||
pub struct BraData {
|
pub struct BraData {
|
||||||
pub uniform: bool,
|
pub uniform: bool,
|
||||||
|
@ -557,11 +557,14 @@ SetpType: ast::ScalarType = {
|
|||||||
|
|
||||||
// https://docs.nvidia.com/cuda/parallel-thread-execution/index.html#logic-and-shift-instructions-not
|
// https://docs.nvidia.com/cuda/parallel-thread-execution/index.html#logic-and-shift-instructions-not
|
||||||
InstNot: ast::Instruction<ast::ParsedArgParams<'input>> = {
|
InstNot: ast::Instruction<ast::ParsedArgParams<'input>> = {
|
||||||
"not" NotType <a:Arg2> => ast::Instruction::Not(ast::NotData{}, a)
|
"not" <t:NotType> <a:Arg2> => ast::Instruction::Not(t, a)
|
||||||
};
|
};
|
||||||
|
|
||||||
NotType = {
|
NotType: ast::NotType = {
|
||||||
".pred", ".b16", ".b32", ".b64"
|
".pred" => ast::NotType::Pred,
|
||||||
|
".b16" => ast::NotType::B16,
|
||||||
|
".b32" => ast::NotType::B32,
|
||||||
|
".b64" => ast::NotType::B64,
|
||||||
};
|
};
|
||||||
|
|
||||||
// https://docs.nvidia.com/cuda/parallel-thread-execution/index.html#control-flow-instructions-at
|
// https://docs.nvidia.com/cuda/parallel-thread-execution/index.html#control-flow-instructions-at
|
||||||
|
@ -46,6 +46,7 @@ test_ptx!(mul_hi, [u64::max_value()], [1u64]);
|
|||||||
test_ptx!(add, [1u64], [2u64]);
|
test_ptx!(add, [1u64], [2u64]);
|
||||||
test_ptx!(setp, [10u64, 11u64], [1u64, 0u64]);
|
test_ptx!(setp, [10u64, 11u64], [1u64, 0u64]);
|
||||||
test_ptx!(bra, [10u64], [11u64]);
|
test_ptx!(bra, [10u64], [11u64]);
|
||||||
|
test_ptx!(not, [0u64], [u64::max_value()]);
|
||||||
|
|
||||||
struct DisplayError<T: Display + Debug> {
|
struct DisplayError<T: Display + Debug> {
|
||||||
err: T,
|
err: T,
|
||||||
|
22
ptx/src/test/spirv_run/not.ptx
Normal file
22
ptx/src/test/spirv_run/not.ptx
Normal file
@ -0,0 +1,22 @@
|
|||||||
|
// Test kernel for the PTX `not` instruction (64-bit bitwise form).
.version 6.5
.target sm_30
.address_size 64

// Reads one 64-bit value through the pointer passed in `input`, inverts it
// with `not.b64`, and writes the result through the pointer passed in `output`.
.visible .entry not(
    .param .u64 input,
    .param .u64 output
)
{
    .reg .u64 in_addr;   // address taken from the `input` parameter
    .reg .u64 out_addr;  // address taken from the `output` parameter
    .reg .u64 temp;      // value loaded from [in_addr]
    .reg .u64 temp2;     // result of not.b64 on temp

    // Fetch both kernel parameters into registers.
    ld.param.u64 in_addr, [input];
    ld.param.u64 out_addr, [output];

    // Load, negate, store.
    ld.u64 temp, [in_addr];
    not.b64 temp2, temp;
    st.u64 [out_addr], temp2;
    ret;
}
|
39
ptx/src/test/spirv_run/not.spvtxt
Normal file
39
ptx/src/test/spirv_run/not.spvtxt
Normal file
@ -0,0 +1,39 @@
|
|||||||
|
OpCapability GenericPointer
|
||||||
|
OpCapability Linkage
|
||||||
|
OpCapability Addresses
|
||||||
|
OpCapability Kernel
|
||||||
|
OpCapability Int64
|
||||||
|
OpCapability Int8
|
||||||
|
%1 = OpExtInstImport "OpenCL.std"
|
||||||
|
OpMemoryModel Physical64 OpenCL
|
||||||
|
OpEntryPoint Kernel %5 "not"
|
||||||
|
%void = OpTypeVoid
|
||||||
|
%ulong = OpTypeInt 64 0
|
||||||
|
%4 = OpTypeFunction %void %ulong %ulong
|
||||||
|
%_ptr_Function_ulong = OpTypePointer Function %ulong
|
||||||
|
%_ptr_Generic_ulong = OpTypePointer Generic %ulong
|
||||||
|
%ulong_0 = OpTypeInt 64 0
|
||||||
|
%5 = OpFunction %void None %4
|
||||||
|
%6 = OpFunctionParameter %ulong
|
||||||
|
%7 = OpFunctionParameter %ulong
|
||||||
|
%20 = OpLabel
|
||||||
|
%8 = OpVariable %_ptr_Function_ulong Function
|
||||||
|
%9 = OpVariable %_ptr_Function_ulong Function
|
||||||
|
%10 = OpVariable %_ptr_Function_ulong Function
|
||||||
|
%11 = OpVariable %_ptr_Function_ulong Function
|
||||||
|
OpStore %8 %6
|
||||||
|
OpStore %9 %7
|
||||||
|
%13 = OpLoad %ulong %8
|
||||||
|
%18 = OpConvertUToPtr %_ptr_Generic_ulong %13
|
||||||
|
%12 = OpLoad %ulong %18
|
||||||
|
OpStore %10 %12
|
||||||
|
%15 = OpLoad %ulong_0 %10
|
||||||
|
%14 = OpNot %ulong_0 %15
|
||||||
|
OpStore %11 %14
|
||||||
|
%16 = OpLoad %ulong %9
|
||||||
|
%17 = OpLoad %ulong %11
|
||||||
|
%19 = OpConvertUToPtr %_ptr_Generic_ulong %16
|
||||||
|
OpStore %19 %17
|
||||||
|
OpReturn
|
||||||
|
OpFunctionEnd
|
||||||
|
|
@ -659,6 +659,15 @@ fn emit_function_body_ops(
|
|||||||
}
|
}
|
||||||
emit_setp(builder, map, setp, arg)?;
|
emit_setp(builder, map, setp, arg)?;
|
||||||
}
|
}
|
||||||
|
ast::Instruction::Not(t, a) => {
|
||||||
|
let result_type = map.get_or_add(builder, SpirvType::from(t.to_type()));
|
||||||
|
let result_id = Some(a.dst);
|
||||||
|
let operand = a.src;
|
||||||
|
match t {
|
||||||
|
ast::NotType::Pred => builder.logical_not(result_type, result_id, operand),
|
||||||
|
_ => builder.not(result_type, result_id, operand),
|
||||||
|
}?;
|
||||||
|
}
|
||||||
_ => todo!(),
|
_ => todo!(),
|
||||||
},
|
},
|
||||||
Statement::LoadVar(arg, typ) => {
|
Statement::LoadVar(arg, typ) => {
|
||||||
@ -887,9 +896,7 @@ fn expand_map_variables<'a>(
|
|||||||
s: ast::Statement<ast::ParsedArgParams<'a>>,
|
s: ast::Statement<ast::ParsedArgParams<'a>>,
|
||||||
) {
|
) {
|
||||||
match s {
|
match s {
|
||||||
ast::Statement::Label(name) => {
|
ast::Statement::Label(name) => result.push(ast::Statement::Label(id_defs.get_id(name))),
|
||||||
result.push(ast::Statement::Label(id_defs.get_id(name)))
|
|
||||||
}
|
|
||||||
ast::Statement::Instruction(p, i) => result.push(ast::Statement::Instruction(
|
ast::Statement::Instruction(p, i) => result.push(ast::Statement::Instruction(
|
||||||
p.map(|p| p.map_variable(&mut |id| id_defs.get_id(id))),
|
p.map(|p| p.map_variable(&mut |id| id_defs.get_id(id))),
|
||||||
i.map_variable(&mut |id| id_defs.get_id(id)),
|
i.map_variable(&mut |id| id_defs.get_id(id)),
|
||||||
@ -1128,7 +1135,9 @@ impl<T: ast::ArgParams> ast::Instruction<T> {
|
|||||||
let inst_type = d.typ;
|
let inst_type = d.typ;
|
||||||
ast::Instruction::SetpBool(d, a.map(visitor, Some(ast::Type::Scalar(inst_type))))
|
ast::Instruction::SetpBool(d, a.map(visitor, Some(ast::Type::Scalar(inst_type))))
|
||||||
}
|
}
|
||||||
ast::Instruction::Not(_, _) => todo!(),
|
ast::Instruction::Not(t, a) => {
|
||||||
|
ast::Instruction::Not(t, a.map(visitor, Some(t.to_type())))
|
||||||
|
}
|
||||||
ast::Instruction::Cvt(_, _) => todo!(),
|
ast::Instruction::Cvt(_, _) => todo!(),
|
||||||
ast::Instruction::Shl(_, _) => todo!(),
|
ast::Instruction::Shl(_, _) => todo!(),
|
||||||
ast::Instruction::St(d, a) => {
|
ast::Instruction::St(d, a) => {
|
||||||
@ -1513,6 +1522,17 @@ impl ast::ScalarType {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
impl ast::NotType {
    /// Converts the `not` operand type into the general `ast::Type`.
    ///
    /// `Pred` becomes the extended scalar predicate type; the `B16`, `B32`
    /// and `B64` variants become the plain scalar type of the same name.
    fn to_type(self) -> ast::Type {
        // Only the predicate case falls outside `ast::ScalarType`, so it is
        // returned directly; the rest share the `Type::Scalar` wrapper.
        let scalar = match self {
            Self::Pred => return ast::Type::ExtendedScalar(ast::ExtendedScalarType::Pred),
            Self::B16 => ast::ScalarType::B16,
            Self::B32 => ast::ScalarType::B32,
            Self::B64 => ast::ScalarType::B64,
        };
        ast::Type::Scalar(scalar)
    }
}
|
||||||
|
|
||||||
impl ast::AddDetails {
|
impl ast::AddDetails {
|
||||||
fn get_type(&self) -> ast::Type {
|
fn get_type(&self) -> ast::Type {
|
||||||
match self {
|
match self {
|
||||||
|
Reference in New Issue
Block a user