Skip to content

Commit

Permalink
MLAS: update SGEMM threading parameters (#2808)
Browse files Browse the repository at this point in the history
  • Loading branch information
tracysh authored Jan 9, 2020
1 parent 71b5165 commit 7ef6570
Showing 1 changed file with 0 additions and 13 deletions.
13 changes: 0 additions & 13 deletions onnxruntime/core/mlas/lib/mlasi.h
Original file line number Diff line number Diff line change
Expand Up @@ -554,21 +554,8 @@ extern "C" {
// Define the target number of per-thread multiplies before using another
// thread to perform additional work.
//
// The number is derived from performance results running SGEMM across a
// range of workloads and observing the ideal number of threads to complete
// that workload.
//

//
// SGEMM threshold: builds compiled with OpenMP enabled (_OPENMP defined) use
// the smallest value; otherwise the value depends on whether
// MLAS_TARGET_AMD64 is defined.
//

#if defined(_OPENMP)
#define MLAS_SGEMM_THREAD_COMPLEXITY (64 * 1024)
#elif defined(MLAS_TARGET_AMD64)
#define MLAS_SGEMM_THREAD_COMPLEXITY (2 * 1024 * 1024)
#else
#define MLAS_SGEMM_THREAD_COMPLEXITY (1 * 1024 * 1024)
#endif

//
// DGEMM threshold: the same value is used for every configuration.
//

#define MLAS_DGEMM_THREAD_COMPLEXITY (64 * 1024)

//
Expand Down

0 comments on commit 7ef6570

Please sign in to comment.