From c2323afed50a123fede0e2157c07ec7142af2225 Mon Sep 17 00:00:00 2001 From: Ahsan Saghir Date: Thu, 30 Jan 2025 01:13:56 +0000 Subject: [PATCH 1/2] Fix rocBLAS failure --- src/targets/gpu/fuse_ops.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/targets/gpu/fuse_ops.cpp b/src/targets/gpu/fuse_ops.cpp index 5e93ccf5ecf..458762eec92 100644 --- a/src/targets/gpu/fuse_ops.cpp +++ b/src/targets/gpu/fuse_ops.cpp @@ -677,7 +677,7 @@ struct find_rocblas_gemm_pointwise : gemm_pointwise shape s = c_ins->get_shape(); // const-fold input if not standard shape since rocblas can't handle it // Updated for a case where "standard" shape has out-of-sequence strides - if(not s.standard()) + if(not s.standard() or s.normalize_standard() != s) { auto c = make_op("contiguous"); auto l = c.compute(c.compute_shape({c_ins->get_shape()}), {c_ins->eval()}); From a3b4d0c118b412b1364d50d892f35a6aef2d415f Mon Sep 17 00:00:00 2001 From: Ahsan Saghir Date: Thu, 30 Jan 2025 20:21:04 +0000 Subject: [PATCH 2/2] Update copyright year for license check --- src/targets/gpu/fuse_ops.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/targets/gpu/fuse_ops.cpp b/src/targets/gpu/fuse_ops.cpp index 458762eec92..91f08a7fdd8 100644 --- a/src/targets/gpu/fuse_ops.cpp +++ b/src/targets/gpu/fuse_ops.cpp @@ -1,7 +1,7 @@ /* * The MIT License (MIT) * - * Copyright (c) 2015-2024 Advanced Micro Devices, Inc. All rights reserved. + * Copyright (c) 2015-2025 Advanced Micro Devices, Inc. All rights reserved. * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal