Skip to content
Merged
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
17 changes: 8 additions & 9 deletions configs/tested-cfgs/SM80_A100/gpgpusim.config
Original file line number Diff line number Diff line change
Expand Up @@ -8,9 +8,8 @@
-gpgpu_heap_size_limit 8388608
-gpgpu_runtime_sync_depth_limit 2
-gpgpu_runtime_pending_launch_count_limit 2048
-gpgpu_kernel_launch_latency 5000
-gpgpu_kernel_launch_latency 5000
-gpgpu_TB_launch_latency 0
-gpgpu_max_concurrent_kernel 128
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Is this removed on purpose?

Copy link
Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

nope

Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Oh wait, I forgot about this. Can you add this line back and open another PR? I'll force-merge it. I don't even think we regress A100.


# Compute Capability
-gpgpu_compute_capability_major 8
Expand All @@ -24,11 +23,11 @@
-gpgpu_n_clusters 108
-gpgpu_n_cores_per_cluster 1
-gpgpu_n_mem 40
-gpgpu_n_sub_partition_per_mchannel 2
-gpgpu_n_sub_partition_per_mchannel 4

# clock domains
#-gpgpu_clock_domains <Core Clock>:<Interconnect Clock>:<L2 Clock>:<DRAM Clock>
-gpgpu_clock_domains 1410:1410:1410:1512
-gpgpu_clock_domains 1410:1410:1512:6048
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Really? 6048 seems a bit high.
Also, do you know how this affects simulation speed?

Copy link
Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Oops, that was one of the experiments.


# shader core pipeline config
-gpgpu_shader_registers 65536
Expand Down Expand Up @@ -93,7 +92,7 @@
# L1 cache configuration
-gpgpu_l1_banks 4
-gpgpu_cache:dl1 S:4:128:64,L:T:m:L:L,A:512:64,16:0,32
-gpgpu_l1_latency 37
-gpgpu_l1_latency 34
-gpgpu_gmem_skip_L1D 0
-gpgpu_flush_l1_cache 1
-gpgpu_n_cluster_ejection_buffer_size 32
Expand All @@ -103,15 +102,15 @@
-gpgpu_shmem_size 167936
-gpgpu_shmem_sizeDefault 167936
-gpgpu_shmem_per_block 49152
-gpgpu_smem_latency 29
-gpgpu_smem_latency 28
# shared memory bankconflict detection
-gpgpu_shmem_num_banks 32
-gpgpu_shmem_limited_broadcast 0
-gpgpu_shmem_warp_parts 1
-gpgpu_coalesce_arch 80

# L2 cache
-gpgpu_cache:dl2 S:256:128:16,L:B:m:L:X,A:192:4,32:0,32
-gpgpu_cache:dl2 S:128:128:16,L:B:m:L:X,A:192:4,32:0,32
-gpgpu_cache:dl2_texture_only 0
-gpgpu_dram_partition_queues 64:64:64:64
-gpgpu_perf_sim_memcpy 1
Expand All @@ -137,8 +136,8 @@
-icnt_arbiter_algo 1

# memory partition latency config
-gpgpu_l2_rop_latency 224
-dram_latency 198
-gpgpu_l2_rop_latency 200
-dram_latency 190

# dram sched config
-gpgpu_dram_scheduler 1
Expand Down