@@ -98,7 +98,7 @@ def speedupk(df: pd.DataFrame, k: int, n: int) -> pd.DataFrame:
98
98
(df ["parallelism_model" ] == "cuda" ) |
99
99
(df ["parallelism_model" ] == "hip" ) |
100
100
((df ["parallelism_model" ] == "kokkos" ) & (df ["num_threads" ] == 32 )) |
101
- ((df ["parallelism_model" ] == "omp" ) & (df ["num_threads" ] == 64 )) |
101
+ ((df ["parallelism_model" ] == "omp" ) & (df ["num_threads" ] == 32 )) |
102
102
((df ["parallelism_model" ] == "mpi" ) & (df ["num_procs" ] == 512 )) |
103
103
((df ["parallelism_model" ] == "mpi+omp" ) & (df ["num_procs" ] == 4 ) & (df ["num_threads" ] == 64 ))]
104
104
df = df .copy ()
@@ -153,17 +153,17 @@ def efficiencyk(df: pd.DataFrame, k: int, n: int) -> pd.DataFrame:
153
153
(df ["parallelism_model" ] == "cuda" ) |
154
154
(df ["parallelism_model" ] == "hip" ) |
155
155
((df ["parallelism_model" ] == "kokkos" ) & (df ["num_threads" ] == 32 )) |
156
- ((df ["parallelism_model" ] == "omp" ) & (df ["num_threads" ] == 64 )) |
156
+ ((df ["parallelism_model" ] == "omp" ) & (df ["num_threads" ] == 32 )) |
157
157
((df ["parallelism_model" ] == "mpi" ) & (df ["num_procs" ] == 512 )) |
158
158
((df ["parallelism_model" ] == "mpi+omp" ) & (df ["num_procs" ] == 4 ) & (df ["num_threads" ] == 64 ))]
159
159
160
- # set n_resources column to 1 for serial; 32 for kokkos; 64 for omp; 512 for mpi; 4*64 for mpi+omp;
160
+ # set n_resources column to 1 for serial; 32 for kokkos; 32 for omp; 512 for mpi; 4*64 for mpi+omp;
161
161
# set it to problem_size for cuda and hip
162
162
df ["n_resources" ] = 1
163
163
df .loc [df ["parallelism_model" ] == "cuda" , "n_resources" ] = df ["problem_size" ]
164
164
df .loc [df ["parallelism_model" ] == "hip" , "n_resources" ] = df ["problem_size" ]
165
165
df .loc [df ["parallelism_model" ] == "kokkos" , "n_resources" ] = 32
166
- df .loc [df ["parallelism_model" ] == "omp" , "n_resources" ] = 64
166
+ df .loc [df ["parallelism_model" ] == "omp" , "n_resources" ] = 32
167
167
df .loc [df ["parallelism_model" ] == "mpi" , "n_resources" ] = 512
168
168
df .loc [df ["parallelism_model" ] == "mpi+omp" , "n_resources" ] = 4 * 64
169
169
0 commit comments