Reproduce and isolate a model latency gap between two OpenVINO commits: find the nodes with the largest time difference between commits, map the hot OpenVINO nodes to oneDNN verbose output, convert the verbose lines into a benchdnn repro, and validate the gap at the oneDNN level.
Use this guide when the same model has different latency on two commits and you want a deterministic oneDNN-level repro.
Tools: benchmark_app, onednn_verbose lines, benchdnn.
Inputs:
- model: full path to the model xml (or a model dir accepted by your benchmark_app build), for example /mnt/disk1/xiuchuan/oneDNN_perf_bug/model.
- ref_commit: known-good commit hash.
- bad_commit: known-bad commit hash.
Outputs:
- gap_analysis.txt: summary of the latency difference, hotspot nodes, and oneDNN perf difference.
- benchdnn_command.txt: benchdnn command files for both commits.
# Base OpenVINO repo and two worktrees (recommended)
export OV_REF_REPO=/path/to/ref
export OV_BAD_REPO=/path/to/bad
export REF_COMMIT=<ref_commit>
export BAD_COMMIT=<bad_commit>
# Checkout paths used throughout this guide
export BR_A="$OV_REF_REPO/openvino"
export BR_B="$OV_BAD_REPO/openvino"
# Results directory and target device
export OUT=/path/to/results
export DEVICE=CPU
mkdir -p "$OUT/A" "$OUT/B"
mkdir -p "$OV_REF_REPO"
cd "$OV_REF_REPO"
git clone https://github.com/openvinotoolkit/openvino.git
cd openvino
git reset --hard "$REF_COMMIT"
git submodule update --init --recursive
mkdir build
cd build
cmake .. -DCMAKE_BUILD_TYPE=RelWithDebInfo
make -j$(nproc)
# Repeat the clone/checkout/build steps in $OV_BAD_REPO with $BAD_COMMIT
export MODEL_XML=<model>
Run benchmark_app in latency mode, using the exact same command on both branches.
# COMMIT A
cd "$OV_REF_REPO"
source venv/ov/bin/activate
benchmark_app -m "$MODEL_XML" -d "$DEVICE" -hint latency -t 10 -niter 1000 \
${SHAPE:+-shape "$SHAPE"} \
> "$OUT/A/bench_latency.log" 2>&1
deactivate
# COMMIT B
cd "$OV_BAD_REPO"
source venv/ov/bin/activate
benchmark_app -m "$MODEL_XML" -d "$DEVICE" -hint latency -t 10 -niter 1000 \
${SHAPE:+-shape "$SHAPE"} \
> "$OUT/B/bench_latency.log" 2>&1
deactivate
Extract latency summary:
grep -E "Latency|Average|Median|percentile" "$OUT/A/bench_latency.log" | tee "$OUT/A/latency_summary.txt"
grep -E "Latency|Average|Median|percentile" "$OUT/B/bench_latency.log" | tee "$OUT/B/latency_summary.txt"
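To quantify the gap, the two summaries can be compared directly. A minimal sketch; the "Median:" line format (value in the second-to-last whitespace field) is an assumption about benchmark_app's summary output, so adjust the pattern to what your build actually prints:

```shell
# Pull the median latency (ms) out of a benchmark_app log.
# Assumes a summary line like "[ INFO ]    Median:   12.34 ms".
median_ms() { awk '/Median:/ { print $(NF-1); exit }' "$1"; }

# Print both medians plus the absolute and relative gap.
latency_gap() {
  awk -v a="$(median_ms "$1")" -v b="$(median_ms "$2")" \
    'BEGIN { printf "A=%.2f ms  B=%.2f ms  gap=%.2f ms (%+.1f%%)\n", a, b, b - a, (b - a) / a * 100 }'
}

# Usage:
#   latency_gap "$OUT/A/bench_latency.log" "$OUT/B/bench_latency.log"
```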
Enable OpenVINO performance counters and runtime verbose in both branches.
# COMMIT A (repeat same in B)
cd "$OV_REF_REPO"
source venv/ov/bin/activate
benchmark_app -m "$MODEL_XML" -d "$DEVICE" -hint latency -t 30 -niter 300 -pc \
${SHAPE:+-shape "$SHAPE"} \
> "$OUT/A/pc_node.log" 2>&1
Collect top PC nodes (longest first):
grep -E "^\[ INFO \] +[0-9]+ +[0-9.]+ +[0-9.]+ +.*" "$OUT/A/pc_node.log" > "$OUT/A/pc_nodes.txt"
grep -E "^\[ INFO \] +[0-9]+ +[0-9.]+ +[0-9.]+ +.*" "$OUT/B/pc_node.log" > "$OUT/B/pc_nodes.txt"
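A small helper can rank the extracted lines for you. This is a sketch that assumes pc_nodes.txt lines look like "[ INFO ] <idx> <realTime ms> <cpuTime ms> <node ...>", i.e. realTime is whitespace field 5; change the sort key if your benchmark_app build prints a different column order:

```shell
# List the N slowest nodes (by the assumed realTime column, field 5).
# top_nodes is a hypothetical helper name, not part of benchmark_app.
top_nodes() { sort -k5,5gr "$1" | head -n "${2:-3}"; }

# Usage:
#   top_nodes "$OUT/A/pc_nodes.txt" 3 | tee "$OUT/target_nodes.txt"
```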
Pick target nodes (for example the top 3 by total time) and record their op names in $OUT/target_nodes.txt.
Capture onednn_verbose for the found nodes. First capture the full oneDNN verbose output, then filter it down to the primitive kinds/shapes that correspond to the target nodes.
# COMMIT A (repeat same in B)
cd "$OV_REF_REPO"
source venv/ov/bin/activate
OV_CPU_VERBOSE=1 ONEDNN_VERBOSE=all \
benchmark_app -m "$MODEL_XML" -d "$DEVICE" -hint latency -t 30 -niter 300 -pc \
${SHAPE:+-shape "$SHAPE"} \
> "$OUT/A/pc_verbose.log" 2>&1
# Full logs already in pc_verbose.log. Extract oneDNN lines:
grep '^onednn_verbose,' "$OUT/A/pc_verbose.log" > "$OUT/A/onednn_full.log"
grep '^onednn_verbose,' "$OUT/B/pc_verbose.log" > "$OUT/B/onednn_full.log"
# Example: focus on matmul/ip/reorder that usually dominate LLM workloads
grep -E 'onednn_verbose,(exec|create),cpu,(matmul|inner_product|reorder),' "$OUT/A/onednn_full.log" > "$OUT/A/onednn_focus.log"
grep -E 'onednn_verbose,(exec|create),cpu,(matmul|inner_product|reorder),' "$OUT/B/onednn_full.log" > "$OUT/B/onednn_focus.log"
If you already know exact shape fragments from verbose, filter tighter, e.g.:
grep 'mb1ic4096oc4096' "$OUT/A/onednn_focus.log" > "$OUT/A/onednn_target.log"
grep 'mb1ic4096oc4096' "$OUT/B/onednn_focus.log" > "$OUT/B/onednn_target.log"
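To see which primitives actually dominate, the filtered verbose can be aggregated per unique descriptor. A sketch assuming standard onednn_verbose CSV lines with the execution time in ms as the last comma field (true for mainstream oneDNN versions, but verify against your logs); `sum_primitives` is a hypothetical helper name:

```shell
# Sum exec time per unique primitive descriptor, slowest first.
# Only ",exec," lines are counted; the trailing time field is stripped to form the key.
sum_primitives() {
  awk -F, '/^onednn_verbose/ && /,exec,/ { t = $NF; sub(/,[^,]*$/, ""); total[$0] += t }
           END { for (k in total) printf "%10.3f ms  %s\n", total[k], k }' "$1" | sort -gr
}

# Usage (run for A and B, then diff the two summaries):
#   sum_primitives "$OUT/A/onednn_focus.log" | head -n 10
```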
In the OpenVINO tree, oneDNN lives at src/plugins/intel_cpu/thirdparty/onednn. Build Release + benchdnn:
# Branch A
cd "$BR_A/src/plugins/intel_cpu/thirdparty/onednn"
cmake -S . -B build-release \
-DCMAKE_BUILD_TYPE=Release \
-DDNNL_BUILD_TESTS=ON \
-DDNNL_BUILD_EXAMPLES=OFF
cmake --build build-release --target benchdnn -j"$(nproc)"
# Branch B
cd "$BR_B/src/plugins/intel_cpu/thirdparty/onednn"
cmake -S . -B build-release \
-DCMAKE_BUILD_TYPE=Release \
-DDNNL_BUILD_TESTS=ON \
-DDNNL_BUILD_EXAMPLES=OFF
cmake --build build-release --target benchdnn -j"$(nproc)"
Use oneDNN’s official converter script in the same branch:
# Branch A
cd "$OUT/A"
python3 "$BR_A/src/plugins/intel_cpu/thirdparty/onednn/scripts/verbose_converter/verbose_converter.py" \
-i onednn_focus.log \
-o onednn_cases.cmd
# Branch B
cd "$OUT/B"
python3 "$BR_B/src/plugins/intel_cpu/thirdparty/onednn/scripts/verbose_converter/verbose_converter.py" \
-i onednn_focus.log \
-o onednn_cases.cmd
This generates benchdnn-compatible command fragments grouped by driver.
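Since the two branches may emit slightly different case sets, it helps to keep only the cases present in both converter outputs, so A and B run identical commands. A sketch; `common_cases` is a hypothetical helper name:

```shell
# Intersect two case files: sort each, keep only lines common to both.
common_cases() {
  sort -u "$1" > "/tmp/_cases_a.$$"
  sort -u "$2" > "/tmp/_cases_b.$$"
  comm -12 "/tmp/_cases_a.$$" "/tmp/_cases_b.$$"
  rm -f "/tmp/_cases_a.$$" "/tmp/_cases_b.$$"
}

# Usage:
#   common_cases "$OUT/A/onednn_cases.cmd" "$OUT/B/onednn_cases.cmd" > "$OUT/common_cases.cmd"
```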
Run the equivalent benchdnn cases on both branches and compare throughput/time. onednn_cases.cmd may contain many commands; each comparison must run the identical command on both branches.
# COMMIT A
# Pick one case line (CMD_A) from "$OUT/A/onednn_cases.cmd", or run the whole
# file with --batch="$OUT/A/onednn_cases.cmd"
cd "$BR_A/src/plugins/intel_cpu/thirdparty/onednn"
./build-release/tests/benchdnn/benchdnn --mode=P $CMD_A
# COMMIT B
# Pick the same case line (CMD_B) from "$OUT/B/onednn_cases.cmd"
cd "$BR_B/src/plugins/intel_cpu/thirdparty/onednn"
./build-release/tests/benchdnn/benchdnn --mode=P $CMD_B
Note: the case passed to benchdnn must be identical on both branches. If the benchdnn numbers show an obvious gap, the regression reproduces at the oneDNN level, and that primitive (verbose line/command) is the root cause of the performance drop.
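If each benchdnn run is tee'd to a log, the average times can be pulled out for a side-by-side comparison. A sketch assuming benchdnn's default perf output template, where the line starts with "perf," and the average time in ms is the second-to-last comma field; verify the field position against your benchdnn version, and note `perf_avg_ms` is a hypothetical helper name:

```shell
# Extract the average time (ms) from the first perf line of a saved
# benchdnn --mode=P log.
perf_avg_ms() { grep '^perf,' "$1" | head -n1 | awk -F, '{ print $(NF-1) }'; }

# Usage:
#   echo "A: $(perf_avg_ms "$OUT/A/benchdnn.log") ms  B: $(perf_avg_ms "$OUT/B/benchdnn.log") ms"
```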
Finally, summarize the findings in gap_analysis.txt: $OUT/A/latency_summary.txt vs $OUT/B/latency_summary.txt, the hotspot nodes from $OUT/target_nodes.txt, and the benchdnn timings for both commits.