ghb_pacman_m.cfg 1.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566
  1. # Configuration file for Xeon X5550 Gainestown
  2. # See http://en.wikipedia.org/wiki/Gainestown_(microprocessor)#Gainestown
  3. # and http://ark.intel.com/products/37106
  4. #include nehalem
  5. [perf_model/l2_cache]
  6. prefetcher = ghb
  7. [perf_model/l2_cache/prefetcher]
  8. prefetch_on_prefetch_hit = true # Do prefetches only on miss (false), or also on hits to lines brought in by the prefetcher (true)
  9. [perf_model/l2_cache/prefetcher/ghb]
  10. width = 2
  11. depth = 2
  12. ghb_size = 512
  13. ghb_table_size = 512
  14. [perf_model/core]
  15. frequency = 2.66
  16. [perf_model/l3_cache]
  17. perfect = false
  18. cache_block_size = 64
  19. cache_size = 4096
  20. associativity = 16
  21. address_hash = mask
  22. replacement_policy = rrip_pacman
  23. drrip = true
  24. data_access_time = 30 # 35 cycles total according to membench, +L1+L2 tag times
  25. tags_access_time = 10
  26. perf_model_type = parallel
  27. writethrough = 0
  28. shared_cores = 8
  29. [perf_model/l3_cache/rrip]
  30. pacman_m = true
  31. bits = 2,2,2,2
  32. [perf_model/dram_directory]
  33. # total_entries = number of entries per directory controller.
  34. total_entries = 1048576
  35. associativity = 16
  36. directory_type = full_map
  37. [perf_model/dram]
  38. # -1 means that we have a number of distributed DRAM controllers (4 in this case)
  39. num_controllers = -1
  40. controllers_interleaving = 4
  41. # DRAM access latency in nanoseconds. Should not include L1-LLC tag access time, directory access time (14 cycles = 5.2 ns),
  42. # or network time [(cache line size + 2*{overhead=40}) / network bandwidth = 18 ns]
  43. # Membench says 175 cycles @ 2.66 GHz = 66 ns total
  44. latency = 45
  45. per_controller_bandwidth = 7.6 # In GB/s, as measured by core_validation-dram
  46. chips_per_dimm = 8
  47. dimms_per_controller = 4
  48. [network]
  49. memory_model_1 = bus
  50. memory_model_2 = bus
  51. [network/bus]
  52. bandwidth = 25.6 # in GB/s. Actually, it's 12.8 GB/s per direction and per connected chip pair
  53. ignore_local_traffic = true # Memory controllers are on-chip, so traffic from core0 to dram0 does not use the QPI links