|
8 | 8 | -gpgpu_heap_size_limit 8388608
|
9 | 9 | -gpgpu_runtime_sync_depth_limit 2
|
10 | 10 | -gpgpu_runtime_pending_launch_count_limit 2048
|
11 |
| --gpgpu_kernel_launch_latency 5000 |
| 11 | +-gpgpu_kernel_launch_latency 5000 |
12 | 12 | -gpgpu_TB_launch_latency 0
|
13 |
| --gpgpu_max_concurrent_kernel 128 |
14 | 13 |
|
15 | 14 | # Compute Capability
|
16 | 15 | -gpgpu_compute_capability_major 8
|
|
24 | 23 | -gpgpu_n_clusters 108
|
25 | 24 | -gpgpu_n_cores_per_cluster 1
|
26 | 25 | -gpgpu_n_mem 40
|
27 |
| --gpgpu_n_sub_partition_per_mchannel 2 |
| 26 | +-gpgpu_n_sub_partition_per_mchannel 4 |
28 | 27 |
|
29 | 28 | # clock domains
|
30 | 29 | #-gpgpu_clock_domains <Core Clock>:<Interconnect Clock>:<L2 Clock>:<DRAM Clock>
|
|
93 | 92 | # L1 cache configuration
|
94 | 93 | -gpgpu_l1_banks 4
|
95 | 94 | -gpgpu_cache:dl1 S:4:128:64,L:T:m:L:L,A:512:64,16:0,32
|
96 |
| --gpgpu_l1_latency 37 |
| 95 | +-gpgpu_l1_latency 34 |
97 | 96 | -gpgpu_gmem_skip_L1D 0
|
98 | 97 | -gpgpu_flush_l1_cache 1
|
99 | 98 | -gpgpu_n_cluster_ejection_buffer_size 32
|
|
103 | 102 | -gpgpu_shmem_size 167936
|
104 | 103 | -gpgpu_shmem_sizeDefault 167936
|
105 | 104 | -gpgpu_shmem_per_block 49152
|
106 |
| --gpgpu_smem_latency 29 |
| 105 | +-gpgpu_smem_latency 28 |
107 | 106 | # shared memory bankconflict detection
|
108 | 107 | -gpgpu_shmem_num_banks 32
|
109 | 108 | -gpgpu_shmem_limited_broadcast 0
|
110 | 109 | -gpgpu_shmem_warp_parts 1
|
111 | 110 | -gpgpu_coalesce_arch 80
|
112 | 111 |
|
113 | 112 | # L2 cache
|
114 |
| --gpgpu_cache:dl2 S:256:128:16,L:B:m:L:X,A:192:4,32:0,32 |
| 113 | +-gpgpu_cache:dl2 S:128:128:16,L:B:m:L:X,A:192:4,32:0,32 |
115 | 114 | -gpgpu_cache:dl2_texture_only 0
|
116 | 115 | -gpgpu_dram_partition_queues 64:64:64:64
|
117 | 116 | -gpgpu_perf_sim_memcpy 1
|
|
137 | 136 | -icnt_arbiter_algo 1
|
138 | 137 |
|
139 | 138 | # memory partition latency config
|
140 |
| --gpgpu_l2_rop_latency 224 |
141 |
| --dram_latency 198 |
| 139 | +-gpgpu_l2_rop_latency 200 |
| 140 | +-dram_latency 190 |
142 | 141 |
|
143 | 142 | # dram sched config
|
144 | 143 | -gpgpu_dram_scheduler 1
|
|
0 commit comments