From 9f767fb80a4fea83c6b767834ee3f76fe9898c50 Mon Sep 17 00:00:00 2001 From: Ahmad Alawneh Date: Sun, 7 Sep 2025 18:19:27 -0400 Subject: [PATCH 1/2] Update gpgpusim.config --- configs/tested-cfgs/SM80_A100/gpgpusim.config | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/configs/tested-cfgs/SM80_A100/gpgpusim.config b/configs/tested-cfgs/SM80_A100/gpgpusim.config index 35f6d18ed..37b6b772d 100644 --- a/configs/tested-cfgs/SM80_A100/gpgpusim.config +++ b/configs/tested-cfgs/SM80_A100/gpgpusim.config @@ -8,9 +8,8 @@ -gpgpu_heap_size_limit 8388608 -gpgpu_runtime_sync_depth_limit 2 -gpgpu_runtime_pending_launch_count_limit 2048 --gpgpu_kernel_launch_latency 5000 +-gpgpu_kernel_launch_latency 5000 -gpgpu_TB_launch_latency 0 --gpgpu_max_concurrent_kernel 128 # Compute Capability -gpgpu_compute_capability_major 8 @@ -24,11 +23,11 @@ -gpgpu_n_clusters 108 -gpgpu_n_cores_per_cluster 1 -gpgpu_n_mem 40 --gpgpu_n_sub_partition_per_mchannel 2 +-gpgpu_n_sub_partition_per_mchannel 4 # clock domains #-gpgpu_clock_domains <Core Clock>:<Interconnect Clock>:<L2 Clock>:<DRAM Clock> --gpgpu_clock_domains 1410:1410:1410:1512 +-gpgpu_clock_domains 1410:1410:1512:6048 # shader core pipeline config -gpgpu_shader_registers 65536 @@ -93,7 +92,7 @@ # L1 cache configuration -gpgpu_l1_banks 4 -gpgpu_cache:dl1 S:4:128:64,L:T:m:L:L,A:512:64,16:0,32 --gpgpu_l1_latency 37 +-gpgpu_l1_latency 34 -gpgpu_gmem_skip_L1D 0 -gpgpu_flush_l1_cache 1 -gpgpu_n_cluster_ejection_buffer_size 32 @@ -103,7 +102,7 @@ -gpgpu_shmem_size 167936 -gpgpu_shmem_sizeDefault 167936 -gpgpu_shmem_per_block 49152 --gpgpu_smem_latency 29 +-gpgpu_smem_latency 28 # shared memory bankconflict detection -gpgpu_shmem_num_banks 32 -gpgpu_shmem_limited_broadcast 0 @@ -111,7 +110,7 @@ -gpgpu_coalesce_arch 80 # L2 cache --gpgpu_cache:dl2 S:256:128:16,L:B:m:L:X,A:192:4,32:0,32 +-gpgpu_cache:dl2 S:128:128:16,L:B:m:L:X,A:192:4,32:0,32 -gpgpu_cache:dl2_texture_only 0 -gpgpu_dram_partition_queues 64:64:64:64 -gpgpu_perf_sim_memcpy 1 @@ -137,8 +136,8 @@ 
-icnt_arbiter_algo 1 # memory partition latency config --gpgpu_l2_rop_latency 224 --dram_latency 198 +-gpgpu_l2_rop_latency 200 +-dram_latency 190 # dram sched config -gpgpu_dram_scheduler 1 From 9f88572328c3b0a2127b11bd96f971c0ed9d5660 Mon Sep 17 00:00:00 2001 From: Ahmad Alawneh Date: Sun, 7 Sep 2025 22:59:38 -0400 Subject: [PATCH 2/2] Update gpgpusim.config --- configs/tested-cfgs/SM80_A100/gpgpusim.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/configs/tested-cfgs/SM80_A100/gpgpusim.config b/configs/tested-cfgs/SM80_A100/gpgpusim.config index 37b6b772d..cfed279cc 100644 --- a/configs/tested-cfgs/SM80_A100/gpgpusim.config +++ b/configs/tested-cfgs/SM80_A100/gpgpusim.config @@ -27,7 +27,7 @@ # clock domains #-gpgpu_clock_domains <Core Clock>:<Interconnect Clock>:<L2 Clock>:<DRAM Clock> --gpgpu_clock_domains 1410:1410:1512:6048 +-gpgpu_clock_domains 1410:1410:1410:1512 # shader core pipeline config -gpgpu_shader_registers 65536