diff --git a/configs/tested-cfgs/SM80_A100/gpgpusim.config b/configs/tested-cfgs/SM80_A100/gpgpusim.config index 35f6d18ed..cfed279cc 100644 --- a/configs/tested-cfgs/SM80_A100/gpgpusim.config +++ b/configs/tested-cfgs/SM80_A100/gpgpusim.config @@ -8,9 +8,8 @@ -gpgpu_heap_size_limit 8388608 -gpgpu_runtime_sync_depth_limit 2 -gpgpu_runtime_pending_launch_count_limit 2048 --gpgpu_kernel_launch_latency 5000 +-gpgpu_kernel_launch_latency 5000 -gpgpu_TB_launch_latency 0 --gpgpu_max_concurrent_kernel 128 # Compute Capability -gpgpu_compute_capability_major 8 @@ -24,7 +23,7 @@ -gpgpu_n_clusters 108 -gpgpu_n_cores_per_cluster 1 -gpgpu_n_mem 40 --gpgpu_n_sub_partition_per_mchannel 2 +-gpgpu_n_sub_partition_per_mchannel 4 # clock domains #-gpgpu_clock_domains ::: @@ -93,7 +92,7 @@ # L1 cache configuration -gpgpu_l1_banks 4 -gpgpu_cache:dl1 S:4:128:64,L:T:m:L:L,A:512:64,16:0,32 --gpgpu_l1_latency 37 +-gpgpu_l1_latency 34 -gpgpu_gmem_skip_L1D 0 -gpgpu_flush_l1_cache 1 -gpgpu_n_cluster_ejection_buffer_size 32 @@ -103,7 +102,7 @@ -gpgpu_shmem_size 167936 -gpgpu_shmem_sizeDefault 167936 -gpgpu_shmem_per_block 49152 --gpgpu_smem_latency 29 +-gpgpu_smem_latency 28 # shared memory bankconflict detection -gpgpu_shmem_num_banks 32 -gpgpu_shmem_limited_broadcast 0 @@ -111,7 +110,7 @@ -gpgpu_coalesce_arch 80 # L2 cache --gpgpu_cache:dl2 S:256:128:16,L:B:m:L:X,A:192:4,32:0,32 +-gpgpu_cache:dl2 S:128:128:16,L:B:m:L:X,A:192:4,32:0,32 -gpgpu_cache:dl2_texture_only 0 -gpgpu_dram_partition_queues 64:64:64:64 -gpgpu_perf_sim_memcpy 1 @@ -137,8 +136,8 @@ -icnt_arbiter_algo 1 # memory partition latency config --gpgpu_l2_rop_latency 224 --dram_latency 198 +-gpgpu_l2_rop_latency 200 +-dram_latency 190 # dram sched config -gpgpu_dram_scheduler 1