Skip to content

Commit

Permalink
feature: Add automated benchmarking to GitHub (#35)
Browse files Browse the repository at this point in the history
* change: nobraket branch

* change: Use multiprocessing Pool rather than ProcessPoolExecutor

* feature: Add automated benchmarking to GitHub

* fix: Use mmap for statevector for performance boost

* fix: Working tests and benchmarks

* fix: Point to correct branch

* fix: Linters

* change: Point at new tagged version

* fix: Lower maximum qubit count for GH

* fix: Benchmark workflow

* fix: Don't commit the output file
  • Loading branch information
kshyatt-aws authored Oct 7, 2024
1 parent c46167a commit c5e9bcd
Show file tree
Hide file tree
Showing 6 changed files with 247 additions and 39 deletions.
45 changes: 45 additions & 0 deletions .github/workflows/benchmark.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
name: Benchmark

on:
push:
branches: [ main ]
pull_request:

jobs:
benchmark:
runs-on: ubuntu-latest
timeout-minutes: 30
steps:
- uses: actions/checkout@v4
- name: Install juliaup
uses: julia-actions/install-juliaup@v2.1.2
with:
channel: '1'
- name: Update Julia registry
shell: julia --project=. --color=yes {0}
run: |
using Pkg
Pkg.Registry.update()
- name: Set up Python
uses: actions/setup-python@v5
with:
python-version: 3.9
- name: Install dependencies
run: |
pip install -e .[test] # to put juliapkg.json in sys.path
python -c 'import juliacall' # force install of all deps
- name: Benchmark
run: |
pytest -n 0 benchmark/benchmark.py --benchmark-json=benchmark/output.json
- name: Store benchmark result
uses: benchmark-action/github-action-benchmark@v1
with:
name: Python Benchmark with pytest-benchmark
tool: 'pytest'
output-file-path: benchmark/output.json
github-token: ${{ secrets.GITHUB_TOKEN }}
auto-push: true
# Show alert with commit comment on detecting possible performance regression
alert-threshold: '200%'
comment-on-alert: true
fail-on-alert: true
151 changes: 151 additions & 0 deletions benchmark/benchmark.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,151 @@
import numpy as np
import pytest
from braket.devices import LocalSimulator
from braket.ir.openqasm import Program

# always the same for repeatability
np.random.seed(0x1C2C6D66)

batch_size = (10, 100)
n_qubits = range(3, 16)
exact_shots_results = (
"state_vector",
"density_matrix q[0], q[1]",
"probability",
"expectation z(q[0])",
"variance y(q[0])",
)
nonzero_shots_results = (
"probability",
"expectation z(q[0])",
"variance y(q[0])",
"sample z(q[0])",
)


def ghz(nq: int, result_type: str):
source = f"OPENQASM 3.0;\nqubit[{nq}] q;\nh q[0];\n"
for q in range(1, nq - 1):
source += f"cnot q[0], q[{q}];\n"

source += f"#pragma braket result {result_type}\n"
return source


def qft(nq: int, result_type: str):
source = f"OPENQASM 3.0;\nqubit[{nq}] q;\n"
for q in range(nq - 1):
angle = np.pi / 2.0
source += f"h q[{q}];\n"
for ctrl_q in range(q + 1, nq - 1):
source += f"cphaseshift({angle}) q[{ctrl_q}], q[{q}];\n"
angle /= 2.0

source += f"#pragma braket result {result_type}\n"
return source


def run_sim(oq3_prog, sim, shots):
sim.run(oq3_prog, shots=shots)
return


def run_sim_batch(oq3_prog, sim, shots):
sim.run_batch(oq3_prog, shots=shots)
return


device_ids = ("braket_sv", "braket_sv_v2", "braket_dm", "braket_dm_v2")

generators = (ghz, qft)


@pytest.mark.parametrize("device_id", device_ids)
@pytest.mark.parametrize("nq", n_qubits)
@pytest.mark.parametrize("exact_results", exact_shots_results)
@pytest.mark.parametrize("circuit", generators)
def test_exact_shots(benchmark, device_id, nq, exact_results, circuit):
if device_id in ("braket_dm_v2", "braket_dm") and (
exact_results in ("state_vector",) or nq > 10
):
pytest.skip()
if (
device_id in ("braket_sv",)
and exact_results in ("density_matrix q[0], q[1]",)
and nq >= 17
):
pytest.skip()
result_type = exact_results
oq3_prog = Program(source=circuit(nq, result_type))
sim = LocalSimulator(device_id)
benchmark.pedantic(run_sim, args=(oq3_prog, sim, 0), iterations=5, warmup_rounds=1)


@pytest.mark.parametrize("device_id", device_ids)
@pytest.mark.parametrize("nq", n_qubits)
@pytest.mark.parametrize("batch_size", batch_size)
@pytest.mark.parametrize("exact_results", exact_shots_results)
@pytest.mark.parametrize("circuit", generators)
def test_exact_shots_batched(
benchmark, device_id, nq, batch_size, exact_results, circuit
):
if device_id in ("braket_dm_v2", "braket_dm") and (
exact_results in ("state_vector,") or nq >= 5
):
pytest.skip()
if nq >= 10:
pytest.skip()
# skip all for now as this is very expensive
pytest.skip()
result_type = exact_results
oq3_prog = [Program(source=circuit(nq, result_type)) for _ in range(batch_size)]
sim = LocalSimulator(device_id)
benchmark.pedantic(
run_sim_batch, args=(oq3_prog, sim, 0), iterations=5, warmup_rounds=1
)


shots = (100,)


@pytest.mark.parametrize("device_id", device_ids)
@pytest.mark.parametrize("nq", n_qubits)
@pytest.mark.parametrize("shots", shots)
@pytest.mark.parametrize("nonzero_shots_results", nonzero_shots_results)
@pytest.mark.parametrize("circuit", generators)
def test_nonzero_shots(benchmark, device_id, nq, shots, nonzero_shots_results, circuit):
if device_id in ("braket_dm_v2", "braket_dm") and nq > 10:
pytest.skip()
result_type = nonzero_shots_results
oq3_prog = Program(source=circuit(nq, result_type))
sim = LocalSimulator(device_id)
benchmark.pedantic(
run_sim, args=(oq3_prog, sim, shots), iterations=5, warmup_rounds=1
)
del sim


@pytest.mark.parametrize("device_id", device_ids)
@pytest.mark.parametrize("nq", n_qubits)
@pytest.mark.parametrize("batch_size", batch_size)
@pytest.mark.parametrize("shots", shots)
@pytest.mark.parametrize("nonzero_shots_results", nonzero_shots_results)
@pytest.mark.parametrize("circuit", generators)
def test_nonzero_shots_batched(
benchmark, device_id, nq, batch_size, shots, nonzero_shots_results, circuit
):
if device_id in ("braket_dm_v2", "braket_dm") and nq >= 5:
pytest.skip()
if nq >= 10:
pytest.skip()

# skip all for now as this is very expensive
pytest.skip()

result_type = nonzero_shots_results
oq3_prog = [Program(source=circuit(nq, result_type)) for _ in range(batch_size)]
sim = LocalSimulator(device_id)
benchmark.pedantic(
run_sim_batch, args=(oq3_prog, sim, shots), iterations=5, warmup_rounds=1
)
del sim
2 changes: 1 addition & 1 deletion requirements.txt
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
juliacall==0.9.22
juliacall==0.9.23
numpy
amazon-braket-schemas>=1.20.2
amazon-braket-sdk>=1.83.0
4 changes: 2 additions & 2 deletions src/braket/juliapkg.json
Original file line number Diff line number Diff line change
@@ -1,9 +1,9 @@
{
"julia": "1.9",
"julia": "1.10",
"packages": {
"BraketSimulator": {
"uuid": "76d27892-9a0b-406c-98e4-7c178e9b3dff",
"version": "0.0.4"
"version": "0.0.5"
},
"JSON3": {
"uuid": "0f8b85d8-7281-11e9-16c2-39a750bddbf1",
Expand Down
77 changes: 43 additions & 34 deletions src/braket/simulator_v2/base_simulator_v2.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ def setup_julia():
# don't reimport if we don't have to
if "juliacall" in sys.modules:
os.environ["PYTHON_JULIACALL_HANDLE_SIGNALS"] = "yes"
return sys.modules["juliacall"].Main
return
else:
for k, default in (
("PYTHON_JULIACALL_HANDLE_SIGNALS", "yes"),
Expand All @@ -40,40 +40,19 @@ def setup_julia():
import juliacall

jl = juliacall.Main
jl.seval("using JSON3, BraketSimulator")
sv_stock_oq3 = """
OPENQASM 3.0;
input float theta;
qubit[2] q;
h q[0];
cnot q;
x q[0];
xx(theta) q;
yy(theta) q;
zz(theta) q;
#pragma braket result expectation z(q[0])
"""
dm_stock_oq3 = """
jl.seval("using BraketSimulator, JSON3")
stock_oq3 = """
OPENQASM 3.0;
input float theta;
qubit[2] q;
h q[0];
x q[0];
cphaseshift(1.5707963267948966) q[1], q[0];
cnot q;
xx(theta) q;
yy(theta) q;
zz(theta) q;
#pragma braket noise bit_flip(0.1) q[0]
#pragma braket result variance y(q[0])
#pragma braket result density_matrix q[0], q[1]
#pragma braket result probability
"""
r = jl.BraketSimulator.simulate(
"braket_sv_v2", sv_stock_oq3, '{"theta": 0.1}', 0
)
jl.JSON3.write(r)
r = jl.BraketSimulator.simulate(
"braket_dm_v2", dm_stock_oq3, '{"theta": 0.1}', 0
)
jl.JSON3.write(r)
jl.BraketSimulator.simulate("braket_dm_v2", stock_oq3, "{}", 0)
return


Expand All @@ -86,6 +65,29 @@ def setup_pool():
return


def _handle_mmaped_result(raw_result, mmap_paths, obj_lengths):
result = GateModelTaskResult(**raw_result)
if mmap_paths:
mmap_files = mmap_paths
array_lens = obj_lengths
mmap_index = 0
for result_ind, result_type in enumerate(result.resultTypes):
if not result_type.value:
d_type = (
np.complex128
if isinstance(result_type.type, (DensityMatrix, StateVector))
else np.float64
)
result.resultTypes[result_ind].value = np.memmap(
mmap_files[mmap_index],
dtype=d_type,
mode="r",
shape=(array_lens[mmap_index],),
)
mmap_index += 1
return result


class BaseLocalSimulatorV2(BaseLocalSimulator):
def __init__(self, device: str):
global __JULIA_POOL__
Expand Down Expand Up @@ -126,8 +128,8 @@ def run_openqasm(
except Exception as e:
_handle_julia_error(e)

result = GateModelTaskResult(**json.loads(jl_result))
jl_result = None
loaded_result = json.loads(jl_result[0])
result = _handle_mmaped_result(loaded_result, jl_result[1], jl_result[2])
result.additionalMetadata.action = openqasm_ir

# attach the result types
Expand Down Expand Up @@ -165,8 +167,15 @@ def run_multiple(
except Exception as e:
_handle_julia_error(e)

loaded_result = json.loads(jl_results[0])
paths_and_lens = json.loads(jl_results[1])
results_paths_lens = [
(loaded_result[r_ix], paths_and_lens[r_ix][0], paths_and_lens[r_ix][1])
for r_ix in range(len(loaded_result))
]
results = [
GateModelTaskResult(**json.loads(jl_result)) for jl_result in jl_results
_handle_mmaped_result(*result_path_len)
for result_path_len in results_paths_lens
]
jl_results = None
for p_ix, program in enumerate(programs):
Expand Down Expand Up @@ -204,9 +213,9 @@ def reconstruct_complex(v):
}
if isinstance(result_type.type, StateVector):
val = task_result.resultTypes[result_ind].value
# complex are stored as tuples of reals
fixed_val = [reconstruct_complex(v) for v in val]
task_result.resultTypes[result_ind].value = np.asarray(fixed_val)
if isinstance(val, list):
fixed_val = [reconstruct_complex(v) for v in val]
task_result.resultTypes[result_ind].value = np.asarray(fixed_val)
if isinstance(result_type.type, DensityMatrix):
val = task_result.resultTypes[result_ind].value
# complex are stored as tuples of reals
Expand Down
7 changes: 5 additions & 2 deletions src/braket/simulator_v2/julia_workers.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@

def _handle_julia_error(error):
# in case juliacall isn't loaded
print(error)
if type(error).__name__ == "JuliaError":
python_exception = getattr(error.exception, "alternate_type", None)
if python_exception is None:
Expand All @@ -29,18 +30,20 @@ def translate_and_run(
device_id: str, openqasm_ir: OpenQASMProgram, shots: int = 0
) -> str:
jl = sys.modules["juliacall"].Main
jl_shots = shots
jl.GC.enable(False)
jl_inputs = json.dumps(openqasm_ir.inputs) if openqasm_ir.inputs else "{}"
try:
result = jl.BraketSimulator.simulate(
device_id,
openqasm_ir.source,
jl_inputs,
jl_shots,
shots,
)

except Exception as e:
_handle_julia_error(e)
finally:
jl.GC.enable(True)

return result

Expand Down

1 comment on commit c5e9bcd

@github-actions
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

⚠️ Performance Alert ⚠️

Possible performance regression was detected for benchmark 'Python Benchmark with pytest-benchmark'.
Benchmark result of this commit is worse than the previous benchmark result exceeding threshold 2.

Benchmark suite Current: c5e9bcd Previous: 85f2ac1 Ratio
benchmark/benchmark.py::test_exact_shots[ghz-variance y(q[0])-5-braket_dm] 47.12688317610862 iter/sec (stddev: 0) 126.67564965919034 iter/sec (stddev: 0) 2.69
benchmark/benchmark.py::test_exact_shots[ghz-variance y(q[0])-7-braket_dm_v2] 129.69355798623124 iter/sec (stddev: 0) 314.06175057039223 iter/sec (stddev: 0) 2.42
benchmark/benchmark.py::test_exact_shots[qft-density_matrix q[0], q[1]-7-braket_dm_v2] 87.64308105463063 iter/sec (stddev: 0) 266.50541312508136 iter/sec (stddev: 0) 3.04
benchmark/benchmark.py::test_exact_shots[qft-variance y(q[0])-7-braket_dm_v2] 71.77157393221735 iter/sec (stddev: 0) 216.9578320323035 iter/sec (stddev: 0) 3.02
benchmark/benchmark.py::test_nonzero_shots[ghz-expectation z(q[0])-100-12-braket_sv] 36.85871674963592 iter/sec (stddev: 0) 77.28683394669166 iter/sec (stddev: 0) 2.10
benchmark/benchmark.py::test_nonzero_shots[ghz-sample z(q[0])-100-14-braket_sv] 32.64162296029481 iter/sec (stddev: 0) 69.25562955118954 iter/sec (stddev: 0) 2.12
benchmark/benchmark.py::test_nonzero_shots[qft-probability-100-12-braket_sv_v2] 41.04276229808575 iter/sec (stddev: 0) 120.90650474087754 iter/sec (stddev: 0) 2.95
benchmark/benchmark.py::test_nonzero_shots[qft-variance y(q[0])-100-7-braket_dm_v2] 40.14938171679087 iter/sec (stddev: 0) 97.51415359436345 iter/sec (stddev: 0) 2.43
benchmark/benchmark.py::test_nonzero_shots[qft-sample z(q[0])-100-4-braket_sv] 36.76165196218521 iter/sec (stddev: 0) 106.73945899272341 iter/sec (stddev: 0) 2.90

This comment was automatically generated by workflow using github-action-benchmark.

Please sign in to comment.