Program Listing for File rocrand_uniform.h

Return to documentation for file (library/include/rocrand/rocrand_uniform.h)

// Copyright (c) 2017-2022 Advanced Micro Devices, Inc. All rights reserved.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

#ifndef ROCRAND_UNIFORM_H_
#define ROCRAND_UNIFORM_H_

#ifndef FQUALIFIERS
#define FQUALIFIERS __forceinline__ __device__
#endif // FQUALIFIERS

#include "rocrand/rocrand_lfsr113.h"
#include "rocrand/rocrand_mrg31k3p.h"
#include "rocrand/rocrand_mrg32k3a.h"
#include "rocrand/rocrand_mtgp32.h"
#include "rocrand/rocrand_philox4x32_10.h"
#include "rocrand/rocrand_scrambled_sobol32.h"
#include "rocrand/rocrand_scrambled_sobol64.h"
#include "rocrand/rocrand_sobol32.h"
#include "rocrand/rocrand_sobol64.h"
#include "rocrand/rocrand_threefry2x32_20.h"
#include "rocrand/rocrand_threefry2x64_20.h"
#include "rocrand/rocrand_threefry4x32_20.h"
#include "rocrand/rocrand_threefry4x64_20.h"
#include "rocrand/rocrand_xorwow.h"

#include "rocrand/rocrand_common.h"

namespace rocrand_device {
namespace detail {

struct two_uints
{
    unsigned int x;
    unsigned int y;
};

union two_uints_to_ulong
{
    two_uints uint2_value;
    unsigned long long int ulong_value;
};

// For unsigned integer between 0 and UINT_MAX, returns value between
// 0.0f and 1.0f, excluding 0.0f and including 1.0f.
FQUALIFIERS
float uniform_distribution(unsigned int v)
{
    return ROCRAND_2POW32_INV + (v * ROCRAND_2POW32_INV);
}

// For unsigned integer between 0 and ULLONG_MAX, returns value between
// 0.0f and 1.0f, excluding 0.0f and including 1.0f.
FQUALIFIERS
float uniform_distribution(unsigned long long int v)
{
    return ROCRAND_2POW32_INV + (v >> 32) * ROCRAND_2POW32_INV;
}

FQUALIFIERS
float4 uniform_distribution4(uint4 v)
{
   return float4 {
       ROCRAND_2POW32_INV + (v.x * ROCRAND_2POW32_INV),
       ROCRAND_2POW32_INV + (v.y * ROCRAND_2POW32_INV),
       ROCRAND_2POW32_INV + (v.z * ROCRAND_2POW32_INV),
       ROCRAND_2POW32_INV + (v.w * ROCRAND_2POW32_INV)
   };
}

FQUALIFIERS float4 uniform_distribution4(ulonglong4 v)
{
    return float4{ROCRAND_2POW64_INV + (v.x * ROCRAND_2POW64_INV),
                  ROCRAND_2POW64_INV + (v.y * ROCRAND_2POW64_INV),
                  ROCRAND_2POW64_INV + (v.z * ROCRAND_2POW64_INV),
                  ROCRAND_2POW64_INV + (v.w * ROCRAND_2POW64_INV)};
}

// For unsigned integer between 0 and UINT_MAX, returns value between
// 0.0 and 1.0, excluding 0.0 and including 1.0.
FQUALIFIERS
double uniform_distribution_double(unsigned int v)
{
    return ROCRAND_2POW32_INV_DOUBLE + (v * ROCRAND_2POW32_INV_DOUBLE);
}

FQUALIFIERS
double uniform_distribution_double(unsigned int v1, unsigned int v2)
{
    two_uints_to_ulong v;
    v.uint2_value.x = v1;
    v.uint2_value.y = (v2 >> 11);
    return ROCRAND_2POW53_INV_DOUBLE + (v.ulong_value * ROCRAND_2POW53_INV_DOUBLE);
}

FQUALIFIERS
double uniform_distribution_double(unsigned long long int v)
{
    return ROCRAND_2POW53_INV_DOUBLE + (
        // 2^53 is the biggest int that can be stored in double, such
        // that it and all smaller integers can be stored in double
        (v >> 11) * ROCRAND_2POW53_INV_DOUBLE
    );
}

FQUALIFIERS
double2 uniform_distribution_double2(uint4 v)
{
    return double2 {
        uniform_distribution_double(v.x, v.y),
        uniform_distribution_double(v.z, v.w)
    };
}

FQUALIFIERS
double4 uniform_distribution_double4(uint4 v1, uint4 v2)
{
    return double4 {
        uniform_distribution_double(v1.x, v1.y),
        uniform_distribution_double(v1.z, v1.w),
        uniform_distribution_double(v2.x, v2.y),
        uniform_distribution_double(v2.z, v2.w)
    };
}

FQUALIFIERS double2 uniform_distribution_double2(ulonglong2 v)
{
    return double2{uniform_distribution_double(v.x), uniform_distribution_double(v.y)};
}

FQUALIFIERS double2 uniform_distribution_double2(ulonglong4 v)
{
    return double2{uniform_distribution_double(v.x), uniform_distribution_double(v.y)};
}

FQUALIFIERS double4 uniform_distribution_double4(ulonglong4 v)
{
    return double4{uniform_distribution_double(v.x),
                   uniform_distribution_double(v.z),
                   uniform_distribution_double(v.x),
                   uniform_distribution_double(v.z)};
}

FQUALIFIERS
__half uniform_distribution_half(unsigned short v)
{
    return __float2half(ROCRAND_2POW16_INV + (v * ROCRAND_2POW16_INV));
}

// For an unsigned integer produced by an MRG-based engine, returns a value
// in range [0, UINT32_MAX].
template<typename state_type>
FQUALIFIERS unsigned int mrg_uniform_distribution_uint(unsigned int v) = delete;

template<>
FQUALIFIERS unsigned int mrg_uniform_distribution_uint<rocrand_state_mrg31k3p>(unsigned int v)
{
    return static_cast<unsigned int>((v - 1) * ROCRAND_MRG31K3P_UINT32_NORM);
}

template<>
FQUALIFIERS unsigned int mrg_uniform_distribution_uint<rocrand_state_mrg32k3a>(unsigned int v)
{
    return static_cast<unsigned int>((v - 1) * ROCRAND_MRG32K3A_UINT_NORM);
}

// For an unsigned integer produced by an MRG-based engine, returns value between
// 0.0f and 1.0f, excluding 0.0f and including 1.0f.
template<typename state_type>
FQUALIFIERS float mrg_uniform_distribution(unsigned int v) = delete;

template<>
FQUALIFIERS float mrg_uniform_distribution<rocrand_state_mrg31k3p>(unsigned int v)
{
    double ret = static_cast<double>(v) * ROCRAND_MRG31K3P_NORM_DOUBLE;
    return static_cast<float>(ret);
}

template<>
FQUALIFIERS float mrg_uniform_distribution<rocrand_state_mrg32k3a>(unsigned int v)
{
    double ret = static_cast<double>(v) * ROCRAND_MRG32K3A_NORM_DOUBLE;
    return static_cast<float>(ret);
}

// For an unsigned integer produced by an MRG generator, returns value between
// 0.0 and 1.0, excluding 0.0 and including 1.0.
template<typename state_type>
FQUALIFIERS double mrg_uniform_distribution_double(unsigned int v) = delete;

template<>
FQUALIFIERS double mrg_uniform_distribution_double<rocrand_state_mrg31k3p>(unsigned int v)
{
    double ret = static_cast<double>(v) * ROCRAND_MRG31K3P_NORM_DOUBLE;
    return ret;
}

template<>
FQUALIFIERS double mrg_uniform_distribution_double<rocrand_state_mrg32k3a>(unsigned int v)
{
    double ret = static_cast<double>(v) * ROCRAND_MRG32K3A_NORM_DOUBLE;
    return ret;
}

} // end namespace detail
} // end namespace rocrand_device

FQUALIFIERS
float rocrand_uniform(rocrand_state_philox4x32_10 * state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
float2 rocrand_uniform2(rocrand_state_philox4x32_10 * state)
{
    auto state1 = rocrand(state);
    auto state2 = rocrand(state);

    return float2 {
        rocrand_device::detail::uniform_distribution(state1),
        rocrand_device::detail::uniform_distribution(state2)
    };
}

FQUALIFIERS
float4 rocrand_uniform4(rocrand_state_philox4x32_10 * state)
{
    return rocrand_device::detail::uniform_distribution4(rocrand4(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_philox4x32_10 * state)
{
    auto state1 = rocrand(state);
    auto state2 = rocrand(state);

    return rocrand_device::detail::uniform_distribution_double(state1, state2);
}

FQUALIFIERS
double2 rocrand_uniform_double2(rocrand_state_philox4x32_10 * state)
{
    return rocrand_device::detail::uniform_distribution_double2(rocrand4(state));
}

FQUALIFIERS
double4 rocrand_uniform_double4(rocrand_state_philox4x32_10 * state)
{
    return rocrand_device::detail::uniform_distribution_double4(rocrand4(state), rocrand4(state));
}

FQUALIFIERS float rocrand_uniform(rocrand_state_mrg31k3p* state)
{
    return rocrand_device::detail::mrg_uniform_distribution<rocrand_state_mrg31k3p>(state->next());
}

FQUALIFIERS double rocrand_uniform_double(rocrand_state_mrg31k3p* state)
{
    return rocrand_device::detail::mrg_uniform_distribution_double<rocrand_state_mrg31k3p>(
        state->next());
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_mrg32k3a * state)
{
    return rocrand_device::detail::mrg_uniform_distribution<rocrand_state_mrg32k3a>(state->next());
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_mrg32k3a * state)
{
    return rocrand_device::detail::mrg_uniform_distribution_double<rocrand_state_mrg32k3a>(
        state->next());
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_xorwow * state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_xorwow * state)
{
    auto state1 = rocrand(state);
    auto state2 = rocrand(state);

    return rocrand_device::detail::uniform_distribution_double(state1, state2);
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_mtgp32 * state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_mtgp32 * state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_sobol32 * state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_sobol32 * state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_scrambled_sobol32* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_scrambled_sobol32* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_sobol64* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_sobol64 * state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_scrambled_sobol64* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_scrambled_sobol64* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS
float rocrand_uniform(rocrand_state_lfsr113* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS
double rocrand_uniform_double(rocrand_state_lfsr113* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS float rocrand_uniform(rocrand_state_threefry2x32_20* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS double rocrand_uniform_double(rocrand_state_threefry2x32_20* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS float rocrand_uniform(rocrand_state_threefry2x64_20* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS double rocrand_uniform_double(rocrand_state_threefry2x64_20* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS float rocrand_uniform(rocrand_state_threefry4x32_20* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS double rocrand_uniform_double(rocrand_state_threefry4x32_20* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

FQUALIFIERS float rocrand_uniform(rocrand_state_threefry4x64_20* state)
{
    return rocrand_device::detail::uniform_distribution(rocrand(state));
}

FQUALIFIERS double rocrand_uniform_double(rocrand_state_threefry4x64_20* state)
{
    return rocrand_device::detail::uniform_distribution_double(rocrand(state));
}

 // end of group rocranddevice
#endif // ROCRAND_UNIFORM_H_