Skip to content

Commit c7ee1a5

Browse files
Implement end to end benchmark (#6910)
1 parent 2725202 commit c7ee1a5

7 files changed

+261
-10
lines changed

.github/workflows/osrm-backend.yml

Lines changed: 18 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -377,12 +377,11 @@ jobs:
377377
key: v4-test-${{ matrix.name }}-${{ github.sha }}
378378
restore-keys: |
379379
v4-test-${{ matrix.name }}-
380-
381380
- name: Prepare environment
382381
run: |
383382
echo "CCACHE_DIR=$HOME/.ccache" >> $GITHUB_ENV
384383
mkdir -p $HOME/.ccache
385-
384+
386385
PACKAGE_JSON_VERSION=$(node -e "console.log(require('./package.json').version)")
387386
echo PUBLISH=$([[ "${GITHUB_REF:-}" == "refs/tags/v${PACKAGE_JSON_VERSION}" ]] && echo "On" || echo "Off") >> $GITHUB_ENV
388387
echo "OSRM_INSTALL_DIR=${GITHUB_WORKSPACE}/install-osrm" >> $GITHUB_ENV
@@ -490,7 +489,7 @@ jobs:
490489
run: |
491490
echo "Using ${JOBS} jobs"
492491
pushd ${OSRM_BUILD_DIR}
493-
492+
494493
ccache --zero-stats
495494
cmake .. -DCMAKE_BUILD_TYPE=${BUILD_TYPE} \
496495
-DENABLE_CONAN=${ENABLE_CONAN:-OFF} \
@@ -508,6 +507,7 @@ jobs:
508507
if [[ "${NODE_PACKAGE_TESTS_ONLY}" != "ON" ]]; then
509508
make tests --jobs=${JOBS}
510509
make benchmarks --jobs=${JOBS}
510+
511511
sudo make install
512512
if [[ "${RUNNER_OS}" == "Linux" ]]; then
513513
echo "LD_LIBRARY_PATH=$LD_LIBRARY_PATH:${OSRM_INSTALL_DIR}/lib" >> $GITHUB_ENV
@@ -628,6 +628,13 @@ jobs:
628628
PR_NUMBER: ${{ github.event.pull_request.number }}
629629
GITHUB_REPOSITORY: ${{ github.repository }}
630630
steps:
631+
- name: Enable data.osm.pbf cache
632+
uses: actions/cache@v4
633+
with:
634+
path: ~/data.osm.pbf
635+
key: v1-data-osm-pbf
636+
restore-keys: |
637+
v1-data-osm-pbf
631638
- name: Enable compiler cache
632639
uses: actions/cache@v4
633640
with:
@@ -648,9 +655,15 @@ jobs:
648655
ref: ${{ github.head_ref }}
649656
path: pr
650657
- name: Install dependencies
651-
run: |
652-
python3 -m pip install "conan<2.0.0" "requests==2.31.0"
658+
run: |
659+
python3 -m pip install "conan<2.0.0" "requests==2.31.0" "locust==2.28.0"
653660
sudo apt-get update -y && sudo apt-get install ccache
661+
- name: Prepare data
  run: |
    # Download the OSM extract only when it is not already present.
    # "$HOME" is used instead of a quoted "~": the shell does not perform tilde
    # expansion inside double quotes, so the previous test looked for a file
    # literally named "~/data.osm.pbf" and therefore always triggered a download.
    if [ ! -f "$HOME/data.osm.pbf" ]; then
      wget http://download.geofabrik.de/europe/germany/berlin-latest.osm.pbf -O "$HOME/data.osm.pbf"
    fi
    # Unpack the GPS traces shipped with the PR checkout.
    gunzip -c ./pr/test/data/berlin_gps_traces.csv.gz > "$HOME/gps_traces.csv"
654667
- name: Prepare environment
655668
run: |
656669
echo "CCACHE_DIR=$HOME/.ccache" >> $GITHUB_ENV

scripts/ci/download_gps_traces.py

Lines changed: 91 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,91 @@
1+
import requests
2+
import xml.etree.ElementTree as ET
3+
import csv
4+
import sys
5+
import argparse
6+
7+
def get_osm_gps_traces(min_lon, min_lat, max_lon, max_lat, timeout=60):
    """Download raw GPS trackpoint documents from the OSM API for a bounding box.

    The bounding box is walked in tiles of at most 0.25 x 0.25 degrees and one
    request is issued per tile (presumably to stay within the API's per-request
    area limit -- confirm against the API documentation). Only page 0 of each
    tile is requested.

    Args:
        min_lon: Western edge of the bounding box.
        min_lat: Southern edge of the bounding box.
        max_lon: Eastern edge of the bounding box.
        max_lat: Northern edge of the bounding box.
        timeout: Value passed to ``requests.get`` as ``timeout`` so a stalled
            connection cannot hang the script forever.

    Returns:
        A list with the raw response body (bytes) of every tile request that
        returned HTTP 200. Failed tiles are reported on stderr and skipped.
        An empty or inverted bounding box yields an empty list.
    """
    url = 'https://api.openstreetmap.org/api/0.6/trackpoints'
    traces = []

    lon_step = 0.25
    lat_step = 0.25

    current_min_lon = min_lon

    while current_min_lon < max_lon:
        # Clamp the last column of tiles to the requested box.
        current_max_lon = min(current_min_lon + lon_step, max_lon)

        current_min_lat = min_lat
        while current_min_lat < max_lat:
            # Clamp the last row of tiles to the requested box.
            current_max_lat = min(current_min_lat + lat_step, max_lat)

            bbox = f'{current_min_lon},{current_min_lat},{current_max_lon},{current_max_lat}'
            print(f"Requesting bbox: {bbox}", file=sys.stderr)

            params = {
                'bbox': bbox,
                'page': 0
            }
            headers = {
                'Accept': 'application/xml'
            }

            try:
                response = requests.get(url, params=params, headers=headers, timeout=timeout)
            except requests.RequestException as e:
                # Treat transport failures like a non-200 answer: log and move on.
                print(f"Error fetching data for bbox {bbox}: {e}", file=sys.stderr)
            else:
                if response.status_code == 200:
                    traces.append(response.content)
                else:
                    print(f"Error fetching data for bbox {bbox}: {response.status_code} {response.text}", file=sys.stderr)

            current_min_lat += lat_step
        current_min_lon += lon_step

    return traces
44+
45+
def parse_gpx_data(gpx_data):
    """Extract track points from a GPX 1.0 document.

    Args:
        gpx_data: The GPX document as ``str`` or ``bytes``.

    Returns:
        A list of tracks; each track is a list of ``[lat, lon, time]`` entries
        where ``lat`` and ``lon`` are the attribute strings of the ``trkpt``
        element and ``time`` is the text of its ``time`` child, or ``''`` when
        there is none. Returns ``[]`` (after logging to stderr) when the
        document cannot be parsed.
    """
    try:
        root = ET.fromstring(gpx_data)
    except ET.ParseError as e:
        print(f"Error parsing GPX data: {e}", file=sys.stderr)
        return []
    namespace = {'gpx': 'http://www.topografix.com/GPX/1/0'}

    tracks = []
    for trk in root.findall('.//gpx:trk', namespace):
        track_data = []
        for trkseg in trk.findall('.//gpx:trkseg', namespace):
            for trkpt in trkseg.findall('gpx:trkpt', namespace):
                lat = trkpt.get('lat')
                lon = trkpt.get('lon')
                # The <time> child lives in the GPX namespace like every other
                # element; a bare 'time' lookup never matches it. The
                # un-namespaced lookup is kept only as a fallback.
                # Compare against None explicitly: a childless Element is falsy.
                time_el = trkpt.find('gpx:time', namespace)
                if time_el is None:
                    time_el = trkpt.find('time')
                timestamp = (time_el.text or '') if time_el is not None else ''
                track_data.append([lat, lon, timestamp])
        tracks.append(track_data)
    return tracks
64+
65+
def save_to_csv(data, file):
    """Write *data* to *file* as CSV, preceded by a fixed header row.

    Args:
        data: Iterable of rows; each row is a sequence of cell values.
        file: Writable text file object that receives the CSV output.
    """
    header = ['TrackID', 'Latitude', 'Longitude', 'Time']
    csv_out = csv.writer(file)
    csv_out.writerow(header)
    for record in data:
        csv_out.writerow(record)
69+
70+
if __name__ == '__main__':
    # Command-line entry point: fetch traces for the given bounding box and
    # print them to stdout as CSV (progress and errors go to stderr).
    parser = argparse.ArgumentParser(description='Fetch and output OSM GPS traces for a given bounding box.')
    for arg_name, arg_help in (
        ('min_lon', 'Minimum longitude of the bounding box'),
        ('min_lat', 'Minimum latitude of the bounding box'),
        ('max_lon', 'Maximum longitude of the bounding box'),
        ('max_lat', 'Maximum latitude of the bounding box'),
    ):
        parser.add_argument(arg_name, type=float, help=arg_help)

    args = parser.parse_args()

    gpx_data_traces = get_osm_gps_traces(args.min_lon, args.min_lat, args.max_lon, args.max_lat)
    print(f"Collected {len(gpx_data_traces)} trace segments", file=sys.stderr)

    # Flatten all downloaded documents into one list of tracks so that track
    # ids are numbered consecutively across documents.
    parsed_tracks = [
        track
        for gpx_data in gpx_data_traces
        for track in parse_gpx_data(gpx_data)
    ]
    all_data = [
        [track_id] + point
        for track_id, track in enumerate(parsed_tracks)
        for point in track
    ]

    # Output all data to stdout
    save_to_csv(all_data, sys.stdout)

scripts/ci/locustfile.py

Lines changed: 74 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,74 @@
1+
from locust import HttpUser, TaskSet, task, between
2+
import csv
3+
import random
4+
from collections import defaultdict
5+
import os
6+
7+
class OSRMTasks(TaskSet):
    """Locust task set issuing route, table, match, nearest and trip requests.

    All request coordinates are drawn from the GPS trace CSV loaded in
    ``on_start``.
    """

    @staticmethod
    def _lon_lat(point):
        """Format a ``(lat, lon)`` tuple as ``"lon,lat"`` with six decimals."""
        lat, lon = point
        return f"{lon:.6f},{lat:.6f}"

    def on_start(self):
        """Seed the RNG and load ``~/gps_traces.csv`` into memory.

        Populates ``self.coordinates`` (every point), ``self.tracks`` (points
        grouped by the ``TrackID`` column) and ``self.track_ids``.
        """
        random.seed(42)

        self.coordinates = []
        self.tracks = defaultdict(list)

        csv_path = os.path.expanduser('~/gps_traces.csv')
        with open(csv_path, 'r') as csv_file:
            for record in csv.DictReader(csv_file):
                point = (float(record['Latitude']), float(record['Longitude']))
                self.coordinates.append(point)
                self.tracks[record['TrackID']].append(point)
        self.track_ids = list(self.tracks)

    @task
    def get_route(self):
        """Request a route between two randomly chosen points."""
        origin = random.choice(self.coordinates)
        destination = random.choice(self.coordinates)

        start_coord = self._lon_lat(origin)
        end_coord = self._lon_lat(destination)

        self.client.get(f"/route/v1/driving/{start_coord};{end_coord}?overview=full&steps=true", name="route")

    @task
    def get_table(self):
        """Request a table for 3 to 100 distinct randomly sampled points."""
        sample_size = random.randint(3, 100)
        sampled = random.sample(self.coordinates, sample_size)
        coords_str = ";".join(self._lon_lat(point) for point in sampled)

        self.client.get(f"/table/v1/driving/{coords_str}", name="table")

    @task
    def get_match(self):
        """Map-match the first 50 to 100 points of a randomly chosen track."""
        # Keep the order of RNG calls: length first, then the track, then radiuses.
        max_points = random.randint(50, 100)
        chosen_track = random.choice(self.track_ids)
        track_points = self.tracks[chosen_track][:max_points]
        coords_str = ";".join(self._lon_lat(point) for point in track_points)
        radiuses_str = ";".join(str(random.randint(5, 20)) for _ in track_points)

        with self.client.get(f"/match/v1/driving/{coords_str}?steps=true&radiuses={radiuses_str}", name="match", catch_response=True) as response:
            # Map matching is expected to fail for some traces; do not count
            # those particular 400 responses as benchmark failures.
            if response.status_code == 400 and response.json()['code'] in ('NoSegment', 'NoMatch'):
                response.success()

    @task
    def get_nearest(self):
        """Request the nearest road segment for one random point."""
        point = random.choice(self.coordinates)
        coord_str = self._lon_lat(point)

        self.client.get(f"/nearest/v1/driving/{coord_str}", name="nearest")

    @task
    def get_trip(self):
        """Request a trip through 2 to 10 distinct randomly sampled points."""
        sample_size = random.randint(2, 10)
        sampled = random.sample(self.coordinates, sample_size)
        coords_str = ";".join(self._lon_lat(point) for point in sampled)

        self.client.get(f"/trip/v1/driving/{coords_str}?steps=true", name="trip")
70+
71+
class OSRMUser(HttpUser):
    """Locust HTTP user whose behaviour is defined by the OSRMTasks task set."""
    tasks = [OSRMTasks]
    # Wait a random interval between requests so the server is not kept at 100% load.
    wait_time = between(0.05, 0.5)

scripts/ci/post_benchmark_results.py

Lines changed: 12 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -16,8 +16,10 @@ def create_markdown_table(results):
1616
rows = []
1717
for result in results:
1818
name = result['name']
19-
base = result['base'].replace('\n', '<br/>')
20-
pr = result['pr'].replace('\n', '<br/>')
19+
base = result['base'] or ''
20+
base = base.replace('\n', '<br/>')
21+
pr = result['pr'] or ''
22+
pr = pr.replace('\n', '<br/>')
2123
row = f"| {name} | {base} | {pr} |"
2224
rows.append(row)
2325
return f"{header}\n" + "\n".join(rows)
@@ -75,7 +77,14 @@ def main():
7577
pr_body = pr_details.get('body', '') or ''
7678

7779
markdown_table = create_markdown_table(benchmark_results)
78-
new_benchmark_section = f"<!-- BENCHMARK_RESULTS_START -->\n## Benchmark Results\n{markdown_table}\n<!-- BENCHMARK_RESULTS_END -->"
80+
new_benchmark_section = f"""
81+
<!-- BENCHMARK_RESULTS_START -->
82+
<details><summary><h2>Benchmark Results</h2></summary>
83+
84+
{markdown_table}
85+
</details>
86+
<!-- BENCHMARK_RESULTS_END -->
87+
"""
7988

8089
if re.search(r'<!-- BENCHMARK_RESULTS_START -->.*<!-- BENCHMARK_RESULTS_END -->', pr_body, re.DOTALL):
8190
updated_body = re.sub(
Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,31 @@
1+
import sys
2+
import csv
3+
4+
def main(locust_csv_base_name, suffix, output_folder):
    """Convert a locust ``*_stats.csv`` file into one ``.bench`` file per request name.

    Args:
        locust_csv_base_name: Path prefix of the locust CSV output; the file
            ``<prefix>_stats.csv`` is read.
        suffix: Tag appended to every output file name.
        output_folder: Directory that receives ``e2e_<name>_<suffix>.bench``.

    The row named ``Aggregated`` is skipped.
    """
    stats_path = f"{locust_csv_base_name}_stats.csv"
    with open(stats_path, 'r') as stats_file:
        for entry in csv.DictReader(stats_file):
            endpoint = entry['Name']
            if endpoint == 'Aggregated':
                continue

            report_lines = [
                f"requests: {entry['Request Count']}",
                f"failures: {entry['Failure Count']}",
                f"req/s: {float(entry['Requests/s']):.3f}req/s",
                f"avg: {float(entry['Average Response Time']):.3f}ms",
                f"50%: {entry['50%']}ms",
                f"75%: {entry['75%']}ms",
                f"95%: {entry['95%']}ms",
                f"98%: {entry['98%']}ms",
                f"99%: {entry['99%']}ms",
                f"min: {float(entry['Min Response Time']):.3f}ms",
                f"max: {float(entry['Max Response Time']):.3f}ms",
            ]
            # The report starts and ends with a newline.
            report = "\n" + "\n".join(report_lines) + "\n"

            with open(f"{output_folder}/e2e_{endpoint}_{suffix}.bench", 'w') as bench_file:
                bench_file.write(report)
26+
27+
if __name__ == '__main__':
    # Script name plus exactly three positional arguments are required.
    expected_argc = 4
    if len(sys.argv) == expected_argc:
        main(*sys.argv[1:])
    else:
        print(f"Usage: {sys.argv[0]} <locust csv base name> <suffix> <output folder>")
        sys.exit(1)

scripts/ci/run_benchmarks.sh

Lines changed: 35 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -13,12 +13,45 @@ function run_benchmarks_for_folder {
1313

1414
./$BENCHMARKS_FOLDER/match-bench "./$FOLDER/test/data/mld/monaco.osrm" mld > "$RESULTS_FOLDER/match_mld.bench"
1515
./$BENCHMARKS_FOLDER/match-bench "./$FOLDER/test/data/ch/monaco.osrm" ch > "$RESULTS_FOLDER/match_ch.bench"
16-
./$BENCHMARKS_FOLDER/route-bench "./$FOLDER/test/data/mld/monaco.osrm" mld > "$RESULTS_FOLDER/route_mld.bench" || true # TODO: remove `true` when this benchmark will be merged to master
17-
./$BENCHMARKS_FOLDER/route-bench "./$FOLDER/test/data/ch/monaco.osrm" ch > "$RESULTS_FOLDER/route_ch.bench" || true # TODO: remove `true` when this benchmark will be merged to master
16+
./$BENCHMARKS_FOLDER/route-bench "./$FOLDER/test/data/mld/monaco.osrm" mld > "$RESULTS_FOLDER/route_mld.bench"
17+
./$BENCHMARKS_FOLDER/route-bench "./$FOLDER/test/data/ch/monaco.osrm" ch > "$RESULTS_FOLDER/route_ch.bench"
1818
./$BENCHMARKS_FOLDER/alias-bench > "$RESULTS_FOLDER/alias.bench"
1919
./$BENCHMARKS_FOLDER/json-render-bench "./$FOLDER/src/benchmarks/portugal_to_korea.json" > "$RESULTS_FOLDER/json-render.bench"
2020
./$BENCHMARKS_FOLDER/packedvector-bench > "$RESULTS_FOLDER/packedvector.bench"
2121
./$BENCHMARKS_FOLDER/rtree-bench "./$FOLDER/test/data/monaco.osrm.ramIndex" "./$FOLDER/test/data/monaco.osrm.fileIndex" "./$FOLDER/test/data/monaco.osrm.nbg_nodes" > "$RESULTS_FOLDER/rtree.bench"
22+
23+
BINARIES_FOLDER="$FOLDER/build"
24+
25+
cp ~/data.osm.pbf $FOLDER
26+
$BINARIES_FOLDER/osrm-extract -p $FOLDER/profiles/car.lua $FOLDER/data.osm.pbf
27+
$BINARIES_FOLDER/osrm-partition $FOLDER/data.osrm
28+
$BINARIES_FOLDER/osrm-customize $FOLDER/data.osrm
29+
$BINARIES_FOLDER/osrm-contract $FOLDER/data.osrm
30+
31+
# End-to-end benchmark: only run when the checkout ships the locust scenario.
if [ -f "$FOLDER/scripts/ci/locustfile.py" ]; then
    for ALGORITHM in mld ch; do
        $BINARIES_FOLDER/osrm-routed --algorithm $ALGORITHM $FOLDER/data.osrm &
        OSRM_ROUTED_PID=$!

        # wait for osrm-routed to start
        curl --retry-delay 3 --retry 10 --retry-all-errors "http://127.0.0.1:5000/route/v1/driving/13.388860,52.517037;13.385983,52.496891?steps=true"
        locust -f $FOLDER/scripts/ci/locustfile.py \
            --headless \
            --processes -1 \
            --users 10 \
            --spawn-rate 1 \
            --host http://localhost:5000 \
            --run-time 1m \
            --csv=locust_results_$ALGORITHM \
            --loglevel ERROR

        python3 $FOLDER/scripts/ci/process_locust_benchmark_results.py locust_results_$ALGORITHM $ALGORITHM $RESULTS_FOLDER

        # Stop this server before the next iteration. `kill -0` only checks that
        # the process exists and sends no signal, so the previous server kept
        # running while the next one was started against the same port 5000.
        kill $OSRM_ROUTED_PID
        # Reap the process; `wait` reports the signal exit status, which must
        # not abort the script if errexit is enabled.
        wait $OSRM_ROUTED_PID || true
    done
fi
54+
2255
}
2356

2457
run_benchmarks_for_folder $1 "${1}_results"

test/data/berlin_gps_traces.csv.gz

518 KB
Binary file not shown.

0 commit comments

Comments
 (0)