cluster.py
来自「M5,一个功能强大的多处理器系统模拟器.很多针对处理器架构,性能的研究都使用它作」· Python 代码 · 共 272 行
PY
272 行
# Simple test script## "m5 test.py"import m5from m5.objects import *import os, optparse, sysm5.AddToPath('../common')# --------------------# Define Command Line Options# ====================parser = optparse.OptionParser()parser.add_option("-d", "--detailed", action="store_true")parser.add_option("-t", "--timing", action="store_true")parser.add_option("-m", "--maxtick", type="int")parser.add_option("-c", "--numclusters", help="Number of clusters", type="int")parser.add_option("-n", "--numcpus", help="Number of cpus in total", type="int")parser.add_option("-f", "--frequency", default = "1GHz", help="Frequency of each CPU")parser.add_option("--l1size", default = "32kB")parser.add_option("--l1latency", default = 1)parser.add_option("--l2size", default = "256kB")parser.add_option("--l2latency", default = 10)parser.add_option("--rootdir", help="ROot directory of Splash2", default="/dist/splash2/codes/")parser.add_option("-b", "--benchmark", help="Splash 2 benchmark to run")(options, args) = parser.parse_args()if args: print "Error: script doesn't take any positional arguments" sys.exit(1)# --------------------# Define Splash2 Benchmarks# ====================class Cholesky(LiveProcess): executable = options.rootdir + '/kernels/cholesky/CHOLESKY' cmd = 'CHOLESKY -p' + str(options.numcpus) + ' '\ + options.rootdir + '/kernels/cholesky/inputs/tk23.O'class FFT(LiveProcess): executable = options.rootdir + 'kernels/fft/FFT' cmd = 'FFT -p' + str(options.numcpus) + ' -m18'class LU_contig(LiveProcess): executable = options.rootdir + 'kernels/lu/contiguous_blocks/LU' cmd = 'LU -p' + str(options.numcpus)class LU_noncontig(LiveProcess): executable = options.rootdir + 'kernels/lu/non_contiguous_blocks/LU' cmd = 'LU -p' + str(options.numcpus)class Radix(LiveProcess): executable = options.rootdir + 'kernels/radix/RADIX' cmd = 'RADIX -n524288 -p' + str(options.numcpus)class Barnes(LiveProcess): executable = options.rootdir + 'apps/barnes/BARNES' cmd = 'BARNES' input = options.rootdir + 'apps/barnes/input.p' + str(options.numcpus)class FMM(LiveProcess): executable = options.rootdir + 'apps/fmm/FMM' cmd = 'FMM' input = options.rootdir + 'apps/fmm/inputs/input.2048.p' + str(options.numcpus)class Ocean_contig(LiveProcess): executable = options.rootdir + 'apps/ocean/contiguous_partitions/OCEAN' cmd = 'OCEAN -p' + str(options.numcpus)class Ocean_noncontig(LiveProcess): executable = options.rootdir + 'apps/ocean/non_contiguous_partitions/OCEAN' cmd = 'OCEAN -p' + str(options.numcpus)class Raytrace(LiveProcess): executable = options.rootdir + 'apps/raytrace/RAYTRACE' cmd = 'RAYTRACE -p' + str(options.numcpus) + ' ' \ + options.rootdir + 'apps/raytrace/inputs/teapot.env'class Water_nsquared(LiveProcess): executable = options.rootdir + 'apps/water-nsquared/WATER-NSQUARED' cmd = 'WATER-NSQUARED' input = options.rootdir + 'apps/water-nsquared/input.p' + str(options.numcpus)class Water_spatial(LiveProcess): executable = options.rootdir + 'apps/water-spatial/WATER-SPATIAL' cmd = 'WATER-SPATIAL' input = options.rootdir + 'apps/water-spatial/input.p' + str(options.numcpus)# --------------------# Base L1 Cache Definition# ====================class L1(BaseCache): latency = options.l1latency block_size = 64 mshrs = 12 tgts_per_mshr = 8# ----------------------# Base L2 Cache Definition# ----------------------class L2(BaseCache): block_size = 64 latency = options.l2latency mshrs = 92 tgts_per_mshr = 16 write_buffers = 8# ----------------------# Define the clusters with their cpus# ----------------------class Cluster: passcpusPerCluster = options.numcpus/options.numclustersbusFrequency = Frequency(options.frequency)busFrequency *= cpusPerClusterall_cpus = []all_l1s = []all_l1buses = []if options.timing: clusters = [ Cluster() for i in xrange(options.numclusters)] for j in xrange(options.numclusters): clusters[j].id = j for cluster in clusters: cluster.clusterbus = Bus(clock=busFrequency) all_l1buses += [cluster.clusterbus] cluster.cpus = [TimingSimpleCPU(cpu_id = i + cluster.id, clock=options.frequency) for i in xrange(cpusPerCluster)] all_cpus += cluster.cpus cluster.l1 = L1(size=options.l1size, assoc = 4) all_l1s += [cluster.l1]elif options.detailed: clusters = [ Cluster() for i in xrange(options.numclusters)] for j in xrange(options.numclusters): clusters[j].id = j for cluster in clusters: cluster.clusterbus = Bus(clock=busFrequency) all_l1buses += [cluster.clusterbus] cluster.cpus = [DerivO3CPU(cpu_id = i + cluster.id, clock=options.frequency) for i in xrange(cpusPerCluster)] all_cpus += cluster.cpus cluster.l1 = L1(size=options.l1size, assoc = 4) all_l1s += [cluster.l1]else: clusters = [ Cluster() for i in xrange(options.numclusters)] for j in xrange(options.numclusters): clusters[j].id = j for cluster in clusters: cluster.clusterbus = Bus(clock=busFrequency) all_l1buses += [cluster.clusterbus] cluster.cpus = [AtomicSimpleCPU(cpu_id = i + cluster.id, clock=options.frequency) for i in xrange(cpusPerCluster)] all_cpus += cluster.cpus cluster.l1 = L1(size=options.l1size, assoc = 4) all_l1s += [cluster.l1]# ----------------------# Create a system, and add system wide objects# ----------------------system = System(cpu = all_cpus, l1_ = all_l1s, l1bus_ = all_l1buses, physmem = PhysicalMemory(), membus = Bus(clock = busFrequency))system.toL2bus = Bus(clock = busFrequency)system.l2 = L2(size = options.l2size, assoc = 8)# ----------------------# Connect the L2 cache and memory together# ----------------------system.physmem.port = system.membus.portsystem.l2.cpu_side = system.toL2bus.portsystem.l2.mem_side = system.membus.port# ----------------------# Connect the L2 cache and clusters together# ----------------------for cluster in clusters: cluster.l1.cpu_side = cluster.clusterbus.port cluster.l1.mem_side = system.toL2bus.port for cpu in cluster.cpus: cpu.icache_port = cluster.clusterbus.port cpu.dcache_port = cluster.clusterbus.port cpu.mem = cluster.l1# ----------------------# Define the root# ----------------------root = Root(system = system)# --------------------# Pick the correct Splash2 Benchmarks# ====================if options.benchmark == 'Cholesky': root.workload = Cholesky()elif options.benchmark == 'FFT': root.workload = FFT()elif options.benchmark == 'LUContig': root.workload = LU_contig()elif options.benchmark == 'LUNoncontig': root.workload = LU_noncontig()elif options.benchmark == 'Radix': root.workload = Radix()elif options.benchmark == 'Barnes': root.workload = Barnes()elif options.benchmark == 'FMM': root.workload = FMM()elif options.benchmark == 'OceanContig': root.workload = Ocean_contig()elif options.benchmark == 'OceanNoncontig': root.workload = Ocean_noncontig()elif options.benchmark == 'Raytrace': root.workload = Raytrace()elif options.benchmark == 'WaterNSquared': root.workload = Water_nsquared()elif options.benchmark == 'WaterSpatial': root.workload = Water_spatial()else: panic("The --benchmark environment variable was set to something" \ +" improper.\nUse Cholesky, FFT, LUContig, LUNoncontig, Radix" \ +", Barnes, FMM, OceanContig,\nOceanNoncontig, Raytrace," \ +" WaterNSquared, or WaterSpatial\n")# --------------------# Assign the workload to the cpus# ====================for cluster in clusters: for cpu in cluster.cpus: cpu.workload = root.workload# ----------------------# Run the simulation# ----------------------if options.timing or options.detailed: root.system.mem_mode = 'timing'# instantiate configurationm5.instantiate(root)# simulate until program terminatesif options.maxtick: exit_event = m5.simulate(options.maxtick)else: exit_event = m5.simulate(m5.MaxTick)print 'Exiting @ tick', m5.curTick(), 'because', exit_event.getCause()
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?