Skip to content

Commit 2d1ac6f

Browse files
Merge pull request #777 from mlcommons/dev
Dev -> Main
2 parents ca3347a + 38554d1 commit 2d1ac6f

2 files changed

Lines changed: 13 additions & 12 deletions

File tree

scoring/performance_profile.py

Lines changed: 12 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,6 @@
2626
the dictionary of submissions.
2727
"""
2828
import itertools
29-
import logging
3029
import operator
3130
import os
3231
import re
@@ -184,10 +183,10 @@ def get_workloads_time_to_target(submission,
184183
if strict:
185184
raise ValueError(
186185
f'Expecting {NUM_BASE_WORKLOADS + NUM_VARIANT_WORKLOADS} workloads '
187-
f'but found {num_workloads} workloads.')
186+
f'but found {num_workloads} workloads for {submission_name}.')
188187
logging.warning(
189188
f'Expecting {NUM_BASE_WORKLOADS + NUM_VARIANT_WORKLOADS} workloads '
190-
f'but found {num_workloads} workloads.')
189+
f'but found {num_workloads} workloads for {submission_name}.')
191190

192191
# For each workload, get the submission times to target.
193192
for workload, group in submission.groupby('workload'):
@@ -198,11 +197,13 @@ def get_workloads_time_to_target(submission,
198197
num_studies = len(group.groupby('study'))
199198
if num_studies != NUM_STUDIES:
200199
if strict:
201-
raise ValueError(f'Expecting {NUM_STUDIES} trials for workload '
202-
f'{workload} but found {num_studies} trials.')
200+
raise ValueError(f'Expecting {NUM_STUDIES} studies for workload '
201+
f'{workload} but found {num_studies} studies '
202+
f'for {submission_name}.')
203203
else:
204-
logging.warning(f'Expecting {NUM_STUDIES} trials for workload '
205-
f'{workload} but found {num_studies} trials.')
204+
logging.warning(f'Expecting {NUM_STUDIES} studies for workload '
205+
f'{workload} but found {num_studies} studies '
206+
f'for {submission_name}.')
206207

207208
# For each study check trials
208209
for study, group in group.groupby('study'):
@@ -213,11 +214,13 @@ def get_workloads_time_to_target(submission,
213214
if strict:
214215
raise ValueError(
215216
f'In Study {study}: Expecting {NUM_TRIALS} trials for workload '
216-
f'{workload} but found {num_trials} trials.')
217+
f'{workload} but found {num_trials} trials '
218+
f'for {submission_name}.')
217219
else:
218220
logging.warning(
219221
f'In Study {study}: Expecting {NUM_TRIALS} trials for workload '
220-
f'{workload} but found {num_trials} trials.')
222+
f'{workload} but found {num_trials} trials '
223+
f'for {submission_name}.')
221224

222225
# Get trial and time index that reaches target
223226
trial_idx, time_idx = get_best_trial_index(
@@ -309,7 +312,6 @@ def compute_performance_profiles(submissions,
309312
df[df.apply(lambda x: x > 4 * best_scores, axis=1)] = np.inf
310313

311314
# For each held-out workload, if the variant target was not hit, set the submission to inf.
312-
framework = None
313315
for workload in df.keys():
314316
if workload not in BASE_WORKLOADS:
315317
# If variants do not have finite score set base_workload score to inf

scoring/score_submissions.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,6 @@
1212
--compute_performance_profiles
1313
"""
1414

15-
import json
1615
import operator
1716
import os
1817
import pickle
@@ -136,7 +135,7 @@ def get_submission_summary(df, include_test_split=True):
136135
return df
137136

138137

139-
def compute_leaderboard_score(df, normalize=False):
138+
def compute_leaderboard_score(df, normalize=True):
140139
"""Compute leaderboard score by taking integral of performance profile.
141140
142141
Args:

0 commit comments

Comments
 (0)