xref: /xnu-11215.81.4/tests/counter/benchmark.lua (revision d4514f0bc1d3f944c22d92e68b646ac3fb40d452)
1*d4514f0bSApple OSS Distributions#!/usr/local/bin/recon
2*d4514f0bSApple OSS Distributionsrequire 'strict'
3*d4514f0bSApple OSS Distributions
4*d4514f0bSApple OSS Distributionslocal benchrun = require 'benchrun'
5*d4514f0bSApple OSS Distributionslocal perfdata = require 'perfdata'
6*d4514f0bSApple OSS Distributionslocal sysctl = require 'sysctl'
7*d4514f0bSApple OSS Distributionslocal csv = require 'csv'
8*d4514f0bSApple OSS Distributions
-- Value used for --num-writes when the caller does not pass one (ten billion).
local kDefaultNumWrites = 10000000000

-- Registers this script's command-line interface on the argument parser that
-- benchrun hands to the modify_argparser hook: one positional argument (the
-- benchmark binary), the worker-count controls, the write count and the
-- counter variant to exercise.
local function add_counter_arguments(argparser)
    argparser:argument{
        name = 'path',
        description = 'Path to benchmark binary',
    }
    argparser:option{
        name = '--cpu-workers',
        description = 'Number of cpu workers',
    }
    argparser:flag{
        name = '--through-max-workers',
        description = 'Run benchmark for [1..n] cpu workers',
    }
    argparser:flag{
        name = '--through-max-workers-fast',
        description = 'Run benchmark for [1..2] and each power of four value in [4..n] cpu workers',
    }
    argparser:option{
        name = '--num-writes',
        description = 'number of writes',
        default = kDefaultNumWrites,
    }
    argparser:option{
        name = '--variant',
        description = 'Which benchmark variant to run (scalable, atomic, or racy)',
        default = 'scalable',
        choices = { 'scalable', 'atomic', 'racy' },
    }
end

-- The benchrun instance driving this script; parsed options are read back
-- through benchmark.opt further down.
local benchmark = benchrun.new {
    name = 'xnu.per_cpu_counter',
    version = 1,
    arg = arg,
    modify_argparser = add_counter_arguments,
}
45*d4514f0bSApple OSS Distributions
-- The positional 'path' argument must name the counter benchmark binary.
assert(benchmark.opt.path, "No path supplied for counter benchmark binary")

-- Use the logical CPU count as the default number of workers.
-- NOTE(review): presumably sysctl() returns nil plus an error value on failure
-- (the second return value was already being captured); guard against a nil
-- result so the failure is reported instead of raising a nil comparison error.
local ncpus, err = sysctl('hw.logicalcpu_max')
assert(ncpus and ncpus > 0, err or 'invalid number of logical cpus')

-- An explicit --cpu-workers value overrides the default; a missing or
-- non-numeric value falls back to the logical CPU count.
local cpu_workers = tonumber(benchmark.opt.cpu_workers) or ncpus

-- Unit attached to the throughput values reported to perfdata.
local writes_per_second = perfdata.unit.custom('writes/sec')

-- Queue of pending runs; each entry is a table with 'path' and 'num_cores'.
local tests = {}
54*d4514f0bSApple OSS Distributions
-- Appends one pending run to the 'tests' queue.
-- num_cores: worker count to hand to the benchmark binary for that run.
-- The binary path is taken from the parsed command-line options.
function QueueTest(num_cores)
    local entry = {
        path = benchmark.opt.path,
        num_cores = num_cores,
    }
    tests[#tests + 1] = entry
end
61*d4514f0bSApple OSS Distributions
-- Decide which worker counts to benchmark:
--   --through-max-workers       every count from 1 up to cpu_workers
--   --through-max-workers-fast  1, 2, then 4, 16, 64, ... while <= cpu_workers
--   (neither flag)              a single run with cpu_workers workers
local opt = benchmark.opt
if opt.through_max_workers then
    for workers = 1, cpu_workers do
        QueueTest(workers)
    end
elseif opt.through_max_workers_fast then
    if cpu_workers >= 1 then
        QueueTest(1)
    end
    -- Always do a run with two threads to see what the first part of the
    -- scaling curve looks like (and to measure perf on dual core systems).
    if cpu_workers >= 2 then
        QueueTest(2)
    end
    -- Remaining points are the powers of four that fit under the limit.
    local workers = 4
    while workers <= cpu_workers do
        QueueTest(workers)
        workers = workers * 4
    end
else
    QueueTest(cpu_workers)
end
81*d4514f0bSApple OSS Distributions
-- Unit for the "loss" column. The script previously referenced a name
-- 'percentage' that was never defined; build the unit the same way the
-- writes/sec unit is built.
local percentage = perfdata.unit.custom('percent')

-- Run every queued configuration, parse the CSV the binary prints after its
-- results marker, and record each column as a perfdata value tagged with the
-- worker count and counter variant.
for _, test in ipairs(tests) do
    -- Positional arguments for the binary: variant, number of writes, workers.
    local args = {test.path, benchmark.opt.variant, benchmark.opt.num_writes, test.num_cores,
                     echo = true}
    for out in benchmark:run(args) do
        -- Everything after the marker line is treated as CSV with a header row.
        -- NOTE: the unescaped '-' characters act as lazy quantifiers in a Lua
        -- pattern; the pattern still matches the literal marker line.
        local result = out:match("-----Results-----\n(.*)")
        benchmark:assert(result, "Unable to find result data in output")
        local data = csv.openstring(result, {header = true})
        for field in data:lines() do
            for k, v in pairs(field) do
                -- Columns are reported as writes/sec where larger is better,
                -- except "loss", a percentage where smaller is better.
                local unit = writes_per_second
                local larger_better = true
                if k == "loss" then
                    unit = percentage
                    larger_better = false
                end
                benchmark.writer:add_value(k, unit, tonumber(v), {
                  [perfdata.larger_better] = larger_better,
                  threads = test.num_cores,
                  variant = benchmark.opt.variant
                })
            end
        end
    end
end

benchmark:finish()
108