diff --git a/library/src/amd_detail/rocblaslt/src/rocblaslt_mat.cpp b/library/src/amd_detail/rocblaslt/src/rocblaslt_mat.cpp index 9ed4053b78..2f55f56e8a 100644 --- a/library/src/amd_detail/rocblaslt/src/rocblaslt_mat.cpp +++ b/library/src/amd_detail/rocblaslt/src/rocblaslt_mat.cpp @@ -2,7 +2,7 @@ * * MIT License * - * Copyright (C) 2022-2024 Advanced Micro Devices, Inc. + * Copyright (C) 2022-2025 Advanced Micro Devices, Inc. * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal @@ -28,6 +28,7 @@ #include "handle.h" #include "rocblaslt_mat_utils.hpp" #include "tensile_host.hpp" +#include #include @@ -376,24 +377,24 @@ rocblaslt_status hipDataType type_c = matC[0]->type; hipDataType type_d = matD[0]->type; - std::vector A_vec, B_vec, C_vec, alpha_vec, beta_vec; - std::vector D_vec, E_vec, amaxD_vec; - std::vector bias_vec; - std::vector scaleA_vec; - std::vector scaleB_vec; - std::vector scaleC_vec; - std::vector scaleD_vec; - std::vector scaleE_vec; - std::vector scaleAlpha_vec; - std::vector bias_type_vec; - std::vector epilogue_vec; - std::vector m_vec, n_vec, k_vec; - std::vector lda_vec, batch_stride_a_vec, num_batches_a_vec; - std::vector ldb_vec, batch_stride_b_vec, num_batches_b_vec; - std::vector ldc_vec, batch_stride_c_vec, num_batches_c_vec; - std::vector ldd_vec, batch_stride_d_vec, num_batches_d_vec; - std::vector lde_vec, batch_stride_e_vec, num_batches_e_vec; - std::vector alpha_1(matmul_descr.size()); + std::vector A_vec, B_vec, C_vec, alpha_vec, beta_vec; + std::vector D_vec, E_vec, amaxD_vec; + std::vector bias_vec; + std::vector scaleA_vec; + std::vector scaleB_vec; + std::vector scaleC_vec; + std::vector scaleD_vec; + std::vector scaleE_vec; + std::vector scaleAlpha_vec; + std::vector bias_type_vec; + std::vector epilogue_vec; + std::vector m_vec, n_vec, k_vec; + std::vector lda_vec, batch_stride_a_vec, num_batches_a_vec; + std::vector ldb_vec, batch_stride_b_vec, num_batches_b_vec; + std::vector ldc_vec, batch_stride_c_vec, num_batches_c_vec; + std::vector ldd_vec, batch_stride_d_vec, num_batches_d_vec; + std::vector lde_vec, batch_stride_e_vec, num_batches_e_vec; + std::vector> alpha_1(matmul_descr.size()); std::vector gradient_vec; @@ -493,10 +494,10 @@ rocblaslt_status return validArgs; const void* alphaTmp = nullptr; - memset(alpha_1[i], 0, sizeof(int8_t) * 16); + memset(alpha_1[i].data(), 0, sizeof(int8_t) * 16); if(scaleAlphaVec) { - setTo1(compute_type, (void*)alpha_1[i], &alphaTmp); + setTo1(compute_type, (void*)alpha_1[i].data(), &alphaTmp); } else { @@ -736,7 +737,8 @@ rocblaslt_status rocblaslt_matmul(rocblaslt_handle handle, "workSpaceSizeInBytes", workspaceSizeInBytes, (matmul_descr->pointermode) ? "alphaVector" : "alpha", - *(reinterpret_cast(alpha)), // TODO: Add casts for f16 and int types of alpha. + *(reinterpret_cast( + alpha)), // TODO: Add casts for f16 and int types of alpha. "beta", *(reinterpret_cast(beta)), "stream", @@ -1193,7 +1195,7 @@ rocblaslt_status rocblaslt_groupedgemm_create_cpp_impl_2(const rocblaslt_handle std::vector lde_vec, batch_stride_e_vec, num_batches_e_vec; std::vector gradient_vec; - std::vector alpha_1(m.size()); + std::vector> alpha_1(m.size()); for(int i = 0; i < m.size(); i++) { @@ -1287,10 +1289,10 @@ rocblaslt_status rocblaslt_groupedgemm_create_cpp_impl_2(const rocblaslt_handle return validArgs; const void* alphaTmp = nullptr; - memset(alpha_1[i], 0, sizeof(int8_t) * 16); + memset(alpha_1[i].data(), 0, sizeof(int8_t) * 16); if(scaleAlphaVec) { - setTo1(compute_type, (void*)alpha_1[i], &alphaTmp); + setTo1(compute_type, (void*)alpha_1[i].data(), &alphaTmp); } else {