revert format change

This commit is contained in:
luoyu-intel 2024-06-19 08:22:02 +00:00
parent 5de2122647
commit e1eabdc2e4

View file

@ -220,8 +220,7 @@ namespace dpct
// a. and b. // a. and b.
i++; i++;
minor = std::stoi(&(ver[i])); minor = std::stoi(&(ver[i]));
} } else {
else {
// c. // c.
minor = 0; minor = 0;
} }
@ -232,7 +231,7 @@ namespace dpct
{ {
public: public:
generic_error_type() = default; generic_error_type() = default;
generic_error_type(T value) : value{ value } {} generic_error_type(T value) : value{value} {}
operator T() const { return value; } operator T() const { return value; }
private: private:
@ -577,7 +576,7 @@ namespace dpct
prop.set_max_work_items_per_compute_unit( prop.set_max_work_items_per_compute_unit(
dev.get_info<sycl::info::device::max_work_group_size>()); dev.get_info<sycl::info::device::max_work_group_size>());
int max_nd_range_size[] = { 0x7FFFFFFF, 0x7FFFFFFF, 0x7FFFFFFF }; int max_nd_range_size[] = {0x7FFFFFFF, 0x7FFFFFFF, 0x7FFFFFFF};
prop.set_max_nd_range_size(max_nd_range_size); prop.set_max_nd_range_size(max_nd_range_size);
// Estimates max register size per work group, feel free to update the value // Estimates max register size per work group, feel free to update the value
@ -590,94 +589,75 @@ namespace dpct
} }
/// dpct device extension /// dpct device extension
class device_ext : public sycl::device class device_ext : public sycl::device {
{
typedef std::mutex mutex_type; typedef std::mutex mutex_type;
public: public:
device_ext() : sycl::device() {} device_ext() : sycl::device() {}
~device_ext() ~device_ext() {
{
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
clear_queues(); clear_queues();
} }
device_ext(const sycl::device &base) : sycl::device(base) device_ext(const sycl::device &base) : sycl::device(base) {
{
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
init_queues(); init_queues();
} }
int is_native_atomic_supported() { return 0; } int is_native_atomic_supported() { return 0; }
int get_major_version() const int get_major_version() const { return dpct::get_major_version(*this); }
{
return dpct::get_major_version(*this);
}
int get_minor_version() const int get_minor_version() const { return dpct::get_minor_version(*this); }
{
return dpct::get_minor_version(*this);
}
int get_max_compute_units() const int get_max_compute_units() const {
{
return get_device_info().get_max_compute_units(); return get_device_info().get_max_compute_units();
} }
/// Return the maximum clock frequency of this device in KHz. /// Return the maximum clock frequency of this device in KHz.
int get_max_clock_frequency() const int get_max_clock_frequency() const {
{
return get_device_info().get_max_clock_frequency(); return get_device_info().get_max_clock_frequency();
} }
int get_integrated() const { return get_device_info().get_integrated(); } int get_integrated() const { return get_device_info().get_integrated(); }
int get_max_sub_group_size() const int get_max_sub_group_size() const {
{
return get_device_info().get_max_sub_group_size(); return get_device_info().get_max_sub_group_size();
} }
int get_max_register_size_per_work_group() const int get_max_register_size_per_work_group() const {
{
return get_device_info().get_max_register_size_per_work_group(); return get_device_info().get_max_register_size_per_work_group();
} }
int get_max_work_group_size() const int get_max_work_group_size() const {
{
return get_device_info().get_max_work_group_size(); return get_device_info().get_max_work_group_size();
} }
int get_mem_base_addr_align() const int get_mem_base_addr_align() const {
{
return get_info<sycl::info::device::mem_base_addr_align>(); return get_info<sycl::info::device::mem_base_addr_align>();
} }
size_t get_global_mem_size() const size_t get_global_mem_size() const {
{
return get_device_info().get_global_mem_size(); return get_device_info().get_global_mem_size();
} }
size_t get_max_mem_alloc_size() const size_t get_max_mem_alloc_size() const {
{
return get_device_info().get_max_mem_alloc_size(); return get_device_info().get_max_mem_alloc_size();
} }
/// Get the number of bytes of free and total memory on the SYCL device. /// Get the number of bytes of free and total memory on the SYCL device.
/// \param [out] free_memory The number of bytes of free memory on the SYCL device. /// \param [out] free_memory The number of bytes of free memory on the
/// \param [out] total_memory The number of bytes of total memory on the SYCL device. /// SYCL device. \param [out] total_memory The number of bytes of total
void get_memory_info(size_t &free_memory, size_t &total_memory) /// memory on the SYCL device.
{ void get_memory_info(size_t &free_memory, size_t &total_memory) {
total_memory = get_device_info().get_global_mem_size(); total_memory = get_device_info().get_global_mem_size();
const char *warning_info = "get_memory_info: [warning] ext_intel_free_memory is not " const char *warning_info =
"get_memory_info: [warning] ext_intel_free_memory is not "
"supported (export/set ZES_ENABLE_SYSMAN=1 to support), " "supported (export/set ZES_ENABLE_SYSMAN=1 to support), "
"use total memory as free memory"; "use total memory as free memory";
#if (defined(__SYCL_COMPILER_VERSION) && __SYCL_COMPILER_VERSION >= 20221105) #if (defined(__SYCL_COMPILER_VERSION) && __SYCL_COMPILER_VERSION >= 20221105)
if (!has(sycl::aspect::ext_intel_free_memory)) if (!has(sycl::aspect::ext_intel_free_memory)) {
{
std::cerr << warning_info << std::endl; std::cerr << warning_info << std::endl;
free_memory = total_memory; free_memory = total_memory;
} } else {
else
{
free_memory = get_info<sycl::ext::intel::info::device::free_memory>(); free_memory = get_info<sycl::ext::intel::info::device::free_memory>();
} }
#else #else
@ -691,20 +671,17 @@ namespace dpct
#endif #endif
} }
void get_device_info(device_info &out) const void get_device_info(device_info &out) const {
{
dpct::get_device_info(out, *this); dpct::get_device_info(out, *this);
} }
device_info get_device_info() const device_info get_device_info() const {
{
device_info prop; device_info prop;
dpct::get_device_info(prop, *this); dpct::get_device_info(prop, *this);
return prop; return prop;
} }
void reset() void reset() {
{
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
clear_queues(); clear_queues();
init_queues(); init_queues();
@ -714,25 +691,20 @@ namespace dpct
sycl::queue &out_of_order_queue() { return _q_out_of_order; } sycl::queue &out_of_order_queue() { return _q_out_of_order; }
sycl::queue &default_queue() sycl::queue &default_queue() { return in_order_queue(); }
{
return in_order_queue();
}
void queues_wait_and_throw() void queues_wait_and_throw() {
{
std::unique_lock<mutex_type> lock(m_mutex); std::unique_lock<mutex_type> lock(m_mutex);
lock.unlock(); lock.unlock();
for (auto &q : _queues) for (auto &q : _queues) {
{
q.wait_and_throw(); q.wait_and_throw();
} }
// Guard the destruct of current_queues to make sure the ref count is safe. // Guard the destruct of current_queues to make sure the ref count is
// safe.
lock.lock(); lock.lock();
} }
sycl::queue create_queue(bool enable_exception_handler = false) sycl::queue create_queue(bool enable_exception_handler = false) {
{
return create_in_order_queue(enable_exception_handler); return create_in_order_queue(enable_exception_handler);
} }
@ -754,52 +726,45 @@ namespace dpct
sycl::property::queue::in_order()); sycl::property::queue::in_order());
} }
sycl::queue create_out_of_order_queue(bool enable_exception_handler = false) { sycl::queue create_out_of_order_queue(
bool enable_exception_handler = false) {
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
return create_queue_impl(enable_exception_handler); return create_queue_impl(enable_exception_handler);
} }
void destroy_queue(sycl::queue queue) void destroy_queue(sycl::queue queue) {
{
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
_queues.clear(); _queues.clear();
} }
void set_saved_queue(sycl::queue q) void set_saved_queue(sycl::queue q) {
{
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
_saved_queue = q; _saved_queue = q;
} }
sycl::queue get_saved_queue() const sycl::queue get_saved_queue() const {
{
std::lock_guard<mutex_type> lock(m_mutex); std::lock_guard<mutex_type> lock(m_mutex);
return _saved_queue; return _saved_queue;
} }
private: private:
void clear_queues() void clear_queues() { _queues.clear(); }
{
_queues.clear();
}
void init_queues() void init_queues() {
{ _q_in_order =
_q_in_order = create_queue_impl(true, sycl::property::queue::in_order()); create_queue_impl(true, sycl::property::queue::in_order());
_q_out_of_order = create_queue_impl(true); _q_out_of_order = create_queue_impl(true);
_saved_queue = default_queue(); _saved_queue = default_queue();
} }
/// Caller should acquire resource \p m_mutex before calling this function. /// Caller should acquire resource \p m_mutex before calling this
/// function.
template <class... Properties> template <class... Properties>
sycl::queue create_queue_impl(bool enable_exception_handler, sycl::queue create_queue_impl(bool enable_exception_handler,
Properties... properties) Properties... properties) {
{
sycl::async_handler eh = {}; sycl::async_handler eh = {};
if (enable_exception_handler) if (enable_exception_handler) {
{
eh = exception_handler; eh = exception_handler;
} }
auto q = sycl::queue( auto q = sycl::queue(*this, eh,
*this, eh,
sycl::property_list( sycl::property_list(
#ifdef DPCT_PROFILING_ENABLED #ifdef DPCT_PROFILING_ENABLED
sycl::property::queue::enable_profiling(), sycl::property::queue::enable_profiling(),
@ -818,8 +783,8 @@ namespace dpct
if (enable_exception_handler) { if (enable_exception_handler) {
eh = exception_handler; eh = exception_handler;
} }
_queues.push_back(sycl::queue( _queues.push_back(
device, eh, sycl::queue(device, eh,
sycl::property_list( sycl::property_list(
#ifdef DPCT_PROFILING_ENABLED #ifdef DPCT_PROFILING_ENABLED
sycl::property::queue::enable_profiling(), sycl::property::queue::enable_profiling(),
@ -829,8 +794,7 @@ namespace dpct
return _queues.back(); return _queues.back();
} }
void get_version(int &major, int &minor) const void get_version(int &major, int &minor) const {
{
detail::get_version(*this, major, minor); detail::get_version(*this, major, minor);
} }
sycl::queue _q_in_order, _q_out_of_order; sycl::queue _q_in_order, _q_out_of_order;
@ -929,15 +893,15 @@ namespace dpct
sycl::backend backend1 = device1.get_backend(); sycl::backend backend1 = device1.get_backend();
sycl::backend backend2 = device2.get_backend(); sycl::backend backend2 = device2.get_backend();
// levelzero backends always come first // levelzero backends always come first
if (backend1 == sycl::backend::ext_oneapi_level_zero && backend2 != sycl::backend::ext_oneapi_level_zero) return true; if(backend1 == sycl::backend::ext_oneapi_level_zero && backend2 != sycl::backend::ext_oneapi_level_zero) return true;
if (backend1 != sycl::backend::ext_oneapi_level_zero && backend2 == sycl::backend::ext_oneapi_level_zero) return false; if(backend1 != sycl::backend::ext_oneapi_level_zero && backend2 == sycl::backend::ext_oneapi_level_zero) return false;
dpct::device_info prop1; dpct::device_info prop1;
dpct::get_device_info(prop1, device1); dpct::get_device_info(prop1, device1);
dpct::device_info prop2; dpct::device_info prop2;
dpct::get_device_info(prop2, device2); dpct::get_device_info(prop2, device2);
return prop1.get_max_compute_units() > prop2.get_max_compute_units(); return prop1.get_max_compute_units() > prop2.get_max_compute_units();
} }
static int convert_backend_index(std::string &backend) { static int convert_backend_index(std::string & backend) {
if (backend == "ext_oneapi_level_zero:gpu") return 0; if (backend == "ext_oneapi_level_zero:gpu") return 0;
if (backend == "opencl:gpu") return 1; if (backend == "opencl:gpu") return 1;
if (backend == "ext_oneapi_cuda:gpu") return 2; if (backend == "ext_oneapi_cuda:gpu") return 2;
@ -977,7 +941,7 @@ namespace dpct
} }
std::vector<std::string> keys; std::vector<std::string> keys;
for (auto it = backend_devices.begin(); it != backend_devices.end(); ++it) { for(auto it = backend_devices.begin(); it != backend_devices.end(); ++it) {
keys.push_back(it->first); keys.push_back(it->first);
} }
std::sort(keys.begin(), keys.end(), compare_backend); std::sort(keys.begin(), keys.end(), compare_backend);
@ -1132,7 +1096,7 @@ namespace dpct
// Allocation // Allocation
sycl::range<1> r(size); sycl::range<1> r(size);
buffer_t buf(r); buffer_t buf(r);
allocation A{ buf, next_free, size }; allocation A{buf, next_free, size};
// Map allocation to device pointer // Map allocation to device pointer
void *result = next_free; void *result = next_free;
m_map.emplace(next_free + size, A); m_map.emplace(next_free + size, A);
@ -1324,7 +1288,7 @@ namespace dpct
static const memcpy_direction static const memcpy_direction
direction_table[static_cast<unsigned>(pointer_access_attribute::end)] direction_table[static_cast<unsigned>(pointer_access_attribute::end)]
[static_cast<unsigned>(pointer_access_attribute::end)] = [static_cast<unsigned>(pointer_access_attribute::end)] =
{ {memcpy_direction::host_to_host, {{memcpy_direction::host_to_host,
memcpy_direction::device_to_host, memcpy_direction::device_to_host,
memcpy_direction::host_to_host}, memcpy_direction::host_to_host},
{memcpy_direction::host_to_device, {memcpy_direction::host_to_device,
@ -1332,7 +1296,7 @@ namespace dpct
memcpy_direction::device_to_device}, memcpy_direction::device_to_device},
{memcpy_direction::host_to_host, {memcpy_direction::host_to_host,
memcpy_direction::device_to_device, memcpy_direction::device_to_device,
memcpy_direction::device_to_device} }; memcpy_direction::device_to_device}};
return direction_table[static_cast<unsigned>(get_pointer_attribute( return direction_table[static_cast<unsigned>(get_pointer_attribute(
q, to_ptr))][static_cast<unsigned>(get_pointer_attribute(q, from_ptr))]; q, to_ptr))][static_cast<unsigned>(get_pointer_attribute(q, from_ptr))];
} }
@ -1411,8 +1375,8 @@ namespace dpct
if (to_slice == from_slice && to_slice == size.get(1) * size.get(0)) if (to_slice == from_slice && to_slice == size.get(1) * size.get(0))
{ {
return { dpct_memcpy(q, to_surface, from_surface, to_slice * size.get(2), return {dpct_memcpy(q, to_surface, from_surface, to_slice * size.get(2),
direction, dep_events) }; direction, dep_events)};
} }
direction = deduce_memcpy_direction(q, to_ptr, from_ptr, direction); direction = deduce_memcpy_direction(q, to_ptr, from_ptr, direction);
size_t size_slice = size.get(1) * size.get(0); size_t size_slice = size.get(1) * size.get(0);
@ -1489,7 +1453,7 @@ namespace dpct
break; break;
} }
case device_to_device: case device_to_device:
event_list.push_back(q.submit([&](sycl::handler &cgh) { event_list.push_back(q.submit([&](sycl::handler &cgh){
cgh.depends_on(dep_events); cgh.depends_on(dep_events);
cgh.parallel_for<class dpct_memcpy_3d_detail>( cgh.parallel_for<class dpct_memcpy_3d_detail>(
size, size,
@ -1746,7 +1710,7 @@ namespace dpct
inline unsigned vectorized_binary(unsigned a, unsigned b, inline unsigned vectorized_binary(unsigned a, unsigned b,
const BinaryOperation binary_op) const BinaryOperation binary_op)
{ {
sycl::vec<unsigned, 1> v0{ a }, v1{ b }; sycl::vec<unsigned, 1> v0{a}, v1{b};
auto v2 = v0.as<VecT>(); auto v2 = v0.as<VecT>();
auto v3 = v1.as<VecT>(); auto v3 = v1.as<VecT>();
auto v4 = auto v4 =
@ -1793,7 +1757,7 @@ namespace dpct
template <typename T1, typename T2> template <typename T1, typename T2>
using dot_product_acc_t = using dot_product_acc_t =
std::conditional_t<std::is_unsigned_v<T1> &&std::is_unsigned_v<T2>, std::conditional_t<std::is_unsigned_v<T1> && std::is_unsigned_v<T2>,
uint32_t, int32_t>; uint32_t, int32_t>;
template <typename T1, typename T2, typename T3> template <typename T1, typename T2, typename T3>
@ -1821,7 +1785,7 @@ namespace dpct
template <typename S, typename T> template <typename S, typename T>
inline T vectorized_min(T a, T b) inline T vectorized_min(T a, T b)
{ {
sycl::vec<T, 1> v0{ a }, v1{ b }; sycl::vec<T, 1> v0{a}, v1{b};
auto v2 = v0.template as<S>(); auto v2 = v0.template as<S>();
auto v3 = v1.template as<S>(); auto v3 = v1.template as<S>();
auto v4 = sycl::min(v2, v3); auto v4 = sycl::min(v2, v3);
@ -2099,8 +2063,8 @@ namespace dpct
if (to_slice == from_slice && to_slice == size.get(1) * size.get(0)) if (to_slice == from_slice && to_slice == size.get(1) * size.get(0))
{ {
return { dpct_memcpy(q, to_surface, from_surface, to_slice * size.get(2), return {dpct_memcpy(q, to_surface, from_surface, to_slice * size.get(2),
direction, dep_events) }; direction, dep_events)};
} }
direction = detail::deduce_memcpy_direction(q, to_ptr, from_ptr, direction); direction = detail::deduce_memcpy_direction(q, to_ptr, from_ptr, direction);
size_t size_slice = size.get(1) * size.get(0); size_t size_slice = size.get(1) * size.get(0);
@ -2900,7 +2864,7 @@ namespace dpct
typename detail::memory_traits<Memory, T>::template accessor_t<0>; typename detail::memory_traits<Memory, T>::template accessor_t<0>;
/// Constructor with initial value. /// Constructor with initial value.
device_memory(const value_t &val) : base(sycl::range<1>(1), { val }) {} device_memory(const value_t &val) : base(sycl::range<1>(1), {val}) {}
/// Default constructor /// Default constructor
device_memory() : base(1) {} device_memory() : base(1) {}