Displaying 3 results from an estimated 3 matches for "float_literal".
2016 Mar 09
2
RFC: Proposing an LLVM subproject for parallelism runtime and support libraries
...he kernel adds a fixed floating point value to the input and writes the
// result to the output location.
static constexpr const char *KERNEL_PTX = R"(
.version 3.1
.target sm_20
.address_size 64
.visible .entry add_mystery_value(
.param .f32 float_literal,
.param .u64 result_loc
) {
.reg .u64 %rl<2>;
.reg .f32 %f<2>;
ld.param.f32 %f1, [float_literal];
ld.param.u64 %rl1, [result_loc];
add.f32 %f1, %f1, 123.0;
st.f32 [%rl1], %f1;
ret;
}...
2016 Mar 09
2
RFC: Proposing an LLVM subproject for parallelism runtime and support libraries
...lue to the input and writes the
> // result to the output location.
> static constexpr const char *KERNEL_PTX = R"(
> .version 3.1
> .target sm_20
> .address_size 64
> .visible .entry add_mystery_value(
> .param .f32 float_literal,
> .param .u64 result_loc
> ) {
> .reg .u64 %rl<2>;
> .reg .f32 %f<2>;
> ld.param.f32 %f1, [float_literal];
> ld.param.u64 %rl1, [result_loc];
> add.f32 %f1, %f1, 123.0;
> st.f32...
2016 Mar 10
2
RFC: Proposing an LLVM subproject for parallelism runtime and support libraries
...ites the
>> // result to the output location.
>> static constexpr const char *KERNEL_PTX = R"(
>> .version 3.1
>> .target sm_20
>> .address_size 64
>> .visible .entry add_mystery_value(
>> .param .f32 float_literal,
>> .param .u64 result_loc
>> ) {
>> .reg .u64 %rl<2>;
>> .reg .f32 %f<2>;
>> ld.param.f32 %f1, [float_literal];
>> ld.param.u64 %rl1, [result_loc];
>> add.f32 %f1, %f1, 1...