metagraphoptimization.jl/examples/qed_bench.jl

using MetagraphOptimization
using LIKWID
using CUDA
using UUIDs
using DataFrames
using CSV
using Random

DISABLE_GPU = true

results_filename = "results.csv"

df = DataFrame(
    process_name = String[],
    graph_gen_time = Float64[],
    optimization_time = Float64[],
    function_generation_time = Float64[],
    graph_nodes = Int[],
    graph_edges = Int[],
    graph_mem = Float64[],
    cpu_threads = Int[],
    n_inputs = Int[],
    nflops_likwid = Int[],
    cpu_time = Float64[],
    cpu_rate = Float64[],
    cpu_gflops = Float64[],
    gpu_name = String[],
    gpu_time = Float64[],
    gpu_rate = Float64[],
    gpu_gflops = Float64[],
)

# if they exist, read existing results and append new ones
if isfile(results_filename)
    df = CSV.read(results_filename, DataFrame)
end

nInputs = 100_000

function cpu_bench(compute_function, inputs)
    compute_function.(inputs[begin:10]) # make sure it's compiled

    time = @elapsed Threads.@threads for i in eachindex(inputs)
        @invokelatest compute_function(inputs[i])
    end
    rate = length(inputs) / time
    return (time, rate)
end

function gpu_bench(compute_function, inputs)
    CUDA.@sync compute_function.(inputs[begin:10])  # make sure it's compiled

    time = @elapsed CUDA.@sync compute_function.(inputs)
    rate = length(inputs) / time

    return (time, rate)
end

function bench_process(
    process::MetagraphOptimization.AbstractProcessDescription,
    process_name::String,
    graph::DAG,
    func,
    gen_time::Float64,
    opt_time::Float64,
    func_time::Float64,
    io::IO = stdout;
    use_likwid = true,
    use_gpu = true,
)
    println(io, "\n--- Benchmarking $(process_name) ---")
    if DISABLE_GPU
        use_gpu = false
    end

    graph_props = GraphProperties(graph)
    NFLOPs = graph_props.computeEffort
    nflops_likwid = 0
    if use_likwid
        input = gen_process_input(process)
        func(input) # compile first

        # get rid of annoying output to console
        oldstd = stdout
        redirect_stdout(devnull)
        _, events = @perfmon "FLOPS_DP" func(input)
        redirect_stdout(oldstd) # recover original stdout

        NFLOPs = first(events["FLOPS_DP"])["RETIRED_SSE_AVX_FLOPS_ALL"]
        nflops_likwid = NFLOPs
    end

    println(io, "Generating $nInputs inputs with $(Threads.nthreads()) threads...")

    inputs = Vector{typeof(gen_process_input(process))}()
    resize!(inputs, nInputs)
    processes = Vector{typeof(process)}()
    for i in 1:Threads.nthreads()
        push!(processes, copy(process))
    end

    Threads.@threads for i in eachindex(inputs)
        inputs[i] = gen_process_input(processes[Threads.nthreads()])
    end

    println(io, "Benchmarking CPU with $(Threads.nthreads()) threads...")
    (time_cpu, rate_cpu) = cpu_bench(func, inputs)
    flops_cpu = (rate_cpu * NFLOPs) / 10^9

    time_gpu = 0.0
    rate_gpu = 0.0
    flops_gpu = 0.0
    gpu_name = "none"
    if use_gpu
        println(io, "Benchmarking GPU...")
        gpu_name = "$(name(first(CUDA.devices())))"
        cuInputs = CuArray(inputs)
        (time_gpu, rate_gpu) = gpu_bench(func, cuInputs)
        flops_gpu = (rate_gpu * NFLOPs) / 10^9
    else
        println(io, "Skipping GPU...")
    end

    println(io, "\nBenchmark Summary for $(process):")

    if use_likwid
        println(io, "Measured FLOPS by LIKWID: $NFLOPs")
    else
        println(io, "Total graph compute effort: $NFLOPs")
    end
    println(io, "Total input size: $(bytes_to_human_readable(Base.summarysize(inputs)))")
    println(io, "CPU, $(Threads.nthreads()) threads")
    println(io, "  Time:  $time_cpu")
    println(io, "  Rate:  $rate_cpu")
    println(io, "  GFLOPS: $flops_cpu")
    if use_gpu
        println(io, "GPU, $gpu_name")
        println(io, "  Time:  $time_gpu")
        println(io, "  Rate:  $rate_gpu")
        println(io, "  GFLOPS: $flops_gpu")
    end

    if (process_name != "warmup")
        push!(
            df,
            Dict(
                :process_name => process_name,
                :graph_gen_time => gen_time,
                :optimization_time => opt_time,
                :function_generation_time => func_time,
                :graph_nodes => graph_props.noNodes,
                :graph_edges => graph_props.noEdges,
                :graph_mem => MetagraphOptimization.mem(graph),
                :cpu_threads => Threads.nthreads(),
                :n_inputs => nInputs,
                :nflops_likwid => nflops_likwid,
                :cpu_time => time_cpu,
                :cpu_rate => rate_cpu,
                :cpu_gflops => flops_cpu,
                :gpu_name => gpu_name,
                :gpu_time => time_gpu,
                :gpu_rate => rate_gpu,
                :gpu_gflops => flops_gpu,
            ),
        )
    end

    return nothing
end

# use "mock" machine that only uses cpu
machine = Machine(
    [
        MetagraphOptimization.NumaNode(
            0,
            1,
            MetagraphOptimization.default_strategy(MetagraphOptimization.NumaNode),
            -1.0,
            UUIDs.uuid1(),
        ),
    ],
    [-1.0;;],
)

# sadly cannot put these in functions because the world age must increase after the function is created which happens only in the global scope

## -- WARMUP TO COMPILE FUNCTIONS first

optimizer = RandomWalkOptimizer(MersenneTwister(0))

# 2-photon compton
process = parse_process("ke->kke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
opt_time = @elapsed optimize!(optimizer, graph, 200)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "warmup", graph, compute_func, gen_time, opt_time, func_gen_time)

optimizer = ReductionOptimizer()

# AB->AB^3
process = parse_process("AB->ABBB", ABCModel())
gen_time = @elapsed graph = parse_dag("input/AB->ABBB.txt", ABCModel())
opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "warmup", graph, compute_func, gen_time, opt_time, func_gen_time)

## -- WARMUP END

optimizer = ReductionOptimizer()

# compton
process = parse_process("ke->ke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)

# 2-photon compton
process = parse_process("ke->kke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)

# 3-photon compton
process = parse_process("ke->kkke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)

# 4-photon compton
process = parse_process("ke->kkkke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time, use_gpu = false)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)

# 5-photon compton
process = parse_process("ke->kkkkke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time, use_gpu = false)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time, use_gpu = false)

# 6-photon compton
process = parse_process("ke->kkkkkke", QEDModel())
gen_time = @elapsed graph = gen_graph(process)
opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time, use_gpu = false)

# AB->AB
process = parse_process("AB->AB", ABCModel())
gen_time = @elapsed graph = parse_dag("input/AB->AB.txt", ABCModel())
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)

# AB->AB^3
process = parse_process("AB->ABBB", ABCModel())
gen_time = @elapsed graph = parse_dag("input/AB->ABBB.txt", ABCModel())
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)

# AB->AB^5
process = parse_process("AB->ABBBBB", ABCModel())
gen_time = @elapsed graph = parse_dag("input/AB->ABBBBB.txt", ABCModel())
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time, use_gpu = false)

opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)
func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)
bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time, use_gpu = false)

CSV.write(results_filename, df)
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`using MetagraphOptimization`
			`using LIKWID`
			`using CUDA`
			`using UUIDs`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`using DataFrames`
			`using CSV`
			`using Random`

Add evaluation script, run script, csv data and first plots 2024-02-06 09:35:04 +01:00			`DISABLE_GPU = true`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00
			`results_filename = "results.csv"`

			`df = DataFrame(`
			`process_name = String[],`
			`graph_gen_time = Float64[],`
			`optimization_time = Float64[],`
			`function_generation_time = Float64[],`
			`graph_nodes = Int[],`
			`graph_edges = Int[],`
			`graph_mem = Float64[],`
			`cpu_threads = Int[],`
			`n_inputs = Int[],`
			`nflops_likwid = Int[],`
			`cpu_time = Float64[],`
			`cpu_rate = Float64[],`
			`cpu_gflops = Float64[],`
			`gpu_name = String[],`
			`gpu_time = Float64[],`
			`gpu_rate = Float64[],`
			`gpu_gflops = Float64[],`
			`)`

			`# if they exist, read existing results and append new ones`
			`if isfile(results_filename)`
			`df = CSV.read(results_filename, DataFrame)`
			`end`

			`nInputs = 100_000`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`function cpu_bench(compute_function, inputs)`
			`compute_function.(inputs[begin:10]) # make sure it's compiled`

			`time = @elapsed Threads.@threads for i in eachindex(inputs)`
			`@invokelatest compute_function(inputs[i])`
			`end`
			`rate = length(inputs) / time`
			`return (time, rate)`
			`end`

			`function gpu_bench(compute_function, inputs)`
			`CUDA.@sync compute_function.(inputs[begin:10]) # make sure it's compiled`

			`time = @elapsed CUDA.@sync compute_function.(inputs)`
			`rate = length(inputs) / time`

			`return (time, rate)`
			`end`

			`function bench_process(`
			`process::MetagraphOptimization.AbstractProcessDescription,`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`process_name::String,`
			`graph::DAG,`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`func,`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time::Float64,`
			`opt_time::Float64,`
			`func_time::Float64,`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`io::IO = stdout;`
			`use_likwid = true,`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`use_gpu = true,`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`)`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`println(io, "\n--- Benchmarking $(process_name) ---")`
			`if DISABLE_GPU`
			`use_gpu = false`
			`end`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`graph_props = GraphProperties(graph)`
			`NFLOPs = graph_props.computeEffort`
			`nflops_likwid = 0`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`if use_likwid`
			`input = gen_process_input(process)`
			`func(input) # compile first`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00
			`# get rid of annoying output to console`
			`oldstd = stdout`
			`redirect_stdout(devnull)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`_, events = @perfmon "FLOPS_DP" func(input)`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`redirect_stdout(oldstd) # recover original stdout`

heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`NFLOPs = first(events["FLOPS_DP"])["RETIRED_SSE_AVX_FLOPS_ALL"]`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`nflops_likwid = NFLOPs`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`end`

			`println(io, "Generating $nInputs inputs with $(Threads.nthreads()) threads...")`

			`inputs = Vector{typeof(gen_process_input(process))}()`
			`resize!(inputs, nInputs)`
			`processes = Vector{typeof(process)}()`
			`for i in 1:Threads.nthreads()`
			`push!(processes, copy(process))`
			`end`

			`Threads.@threads for i in eachindex(inputs)`
			`inputs[i] = gen_process_input(processes[Threads.nthreads()])`
			`end`

			`println(io, "Benchmarking CPU with $(Threads.nthreads()) threads...")`
			`(time_cpu, rate_cpu) = cpu_bench(func, inputs)`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`flops_cpu = (rate_cpu * NFLOPs) / 10^9`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`time_gpu = 0.0`
			`rate_gpu = 0.0`
			`flops_gpu = 0.0`
			`gpu_name = "none"`
			`if use_gpu`
			`println(io, "Benchmarking GPU...")`
			`gpu_name = "$(name(first(CUDA.devices())))"`
			`cuInputs = CuArray(inputs)`
			`(time_gpu, rate_gpu) = gpu_bench(func, cuInputs)`
			`flops_gpu = (rate_gpu * NFLOPs) / 10^9`
			`else`
			`println(io, "Skipping GPU...")`
			`end`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`println(io, "\nBenchmark Summary for $(process):")`

			`if use_likwid`
			`println(io, "Measured FLOPS by LIKWID: $NFLOPs")`
			`else`
			`println(io, "Total graph compute effort: $NFLOPs")`
			`end`
			`println(io, "Total input size: $(bytes_to_human_readable(Base.summarysize(inputs)))")`
			`println(io, "CPU, $(Threads.nthreads()) threads")`
			`println(io, " Time: $time_cpu")`
			`println(io, " Rate: $rate_cpu")`
			`println(io, " GFLOPS: $flops_cpu")`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`if use_gpu`
			`println(io, "GPU, $gpu_name")`
			`println(io, " Time: $time_gpu")`
			`println(io, " Rate: $rate_gpu")`
			`println(io, " GFLOPS: $flops_gpu")`
			`end`

			`if (process_name != "warmup")`
			`push!(`
			`df,`
			`Dict(`
			`:process_name => process_name,`
			`:graph_gen_time => gen_time,`
			`:optimization_time => opt_time,`
			`:function_generation_time => func_time,`
			`:graph_nodes => graph_props.noNodes,`
			`:graph_edges => graph_props.noEdges,`
			`:graph_mem => MetagraphOptimization.mem(graph),`
			`:cpu_threads => Threads.nthreads(),`
			`:n_inputs => nInputs,`
			`:nflops_likwid => nflops_likwid,`
			`:cpu_time => time_cpu,`
			`:cpu_rate => rate_cpu,`
			`:cpu_gflops => flops_cpu,`
			`:gpu_name => gpu_name,`
			`:gpu_time => time_gpu,`
			`:gpu_rate => rate_gpu,`
			`:gpu_gflops => flops_gpu,`
			`),`
			`)`
			`end`

			`return nothing`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`end`

			`# use "mock" machine that only uses cpu`
			`machine = Machine(`
			`[`
			`MetagraphOptimization.NumaNode(`
			`0,`
			`1,`
			`MetagraphOptimization.default_strategy(MetagraphOptimization.NumaNode),`
			`-1.0,`
			`UUIDs.uuid1(),`
			`),`
			`],`
			`[-1.0;;],`
			`)`

			`# sadly cannot put these in functions because the world age must increase after the function is created which happens only in the global scope`

Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`## -- WARMUP TO COMPILE FUNCTIONS first`

			`optimizer = RandomWalkOptimizer(MersenneTwister(0))`

			`# 2-photon compton`
			`process = parse_process("ke->kke", QEDModel())`
			`gen_time = @elapsed graph = gen_graph(process)`
			`opt_time = @elapsed optimize!(optimizer, graph, 200)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "warmup", graph, compute_func, gen_time, opt_time, func_gen_time)`

			`optimizer = ReductionOptimizer()`

			`# AB->AB^3`
			`process = parse_process("AB->ABBB", ABCModel())`
			`gen_time = @elapsed graph = parse_dag("input/AB->ABBB.txt", ABCModel())`
			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "warmup", graph, compute_func, gen_time, opt_time, func_gen_time)`

			`## -- WARMUP END`

			`optimizer = ReductionOptimizer()`

heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00			`# compton`
			`process = parse_process("ke->ke", QEDModel())`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time = @elapsed graph = gen_graph(process)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`# 2-photon compton`
			`process = parse_process("ke->kke", QEDModel())`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time = @elapsed graph = gen_graph(process)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`# 3-photon compton`
			`process = parse_process("ke->kkke", QEDModel())`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time = @elapsed graph = gen_graph(process)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)`

			`# 4-photon compton`
			`process = parse_process("ke->kkkke", QEDModel())`
			`gen_time = @elapsed graph = gen_graph(process)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time, use_gpu = false)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)`

			`# 5-photon compton`
			`process = parse_process("ke->kkkkke", QEDModel())`
			`gen_time = @elapsed graph = gen_graph(process)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time, use_gpu = false)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time, use_gpu = false)`

			`# 6-photon compton`
			`process = parse_process("ke->kkkkkke", QEDModel())`
			`gen_time = @elapsed graph = gen_graph(process)`
			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time, use_gpu = false)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`# AB->AB`
			`process = parse_process("AB->AB", ABCModel())`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time = @elapsed graph = parse_dag("input/AB->AB.txt", ABCModel())`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`# AB->AB^3`
			`process = parse_process("AB->ABBB", ABCModel())`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time = @elapsed graph = parse_dag("input/AB->ABBB.txt", ABCModel())`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time)`
heterogeneity (#27) Prepare things to work with heterogeneity, make things work on GPU Reviewed-on: https://code.woubery.com/Rubydragon/MetagraphOptimization.jl/pulls/27 Co-authored-by: Anton Reinhard <anton.reinhard@proton.me> Co-committed-by: Anton Reinhard <anton.reinhard@proton.me> 2023-12-18 14:31:52 +01:00
			`# AB->AB^5`
			`process = parse_process("AB->ABBBBB", ABCModel())`
Add qed bench run script and singularity container 2024-02-02 06:56:16 +01:00			`gen_time = @elapsed graph = parse_dag("input/AB->ABBBBB.txt", ABCModel())`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process no optimization", graph, compute_func, gen_time, 0.0, func_gen_time, use_gpu = false)`

			`opt_time = @elapsed optimize_to_fixpoint!(optimizer, graph)`
			`func_gen_time = @elapsed compute_func = get_compute_function(graph, process, machine)`
			`bench_process(process, "$process reduced", graph, compute_func, gen_time, opt_time, func_gen_time, use_gpu = false)`

			`CSV.write(results_filename, df)`