Skip to content

Commit 38554d1

Browse files
Merge pull request #776 from fsschneider/scoring_QoL
Scoring: Quality of Life improvements
2 parents ec434a9 + 9b6c845 commit 38554d1

3 files changed

Lines changed: 14 additions & 13 deletions

File tree

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@
2929
> [!IMPORTANT]
3030
> Submitters are no longer required to self-report results.
3131
> We are currently in the process of evaluating and scoring received submissions.
32-
> We are aiming to release results by July 15th 2024.
32+
> Results coming soon!
3333
> For other key dates please see [Call for Submissions](CALL_FOR_SUBMISSIONS.md).
3434
3535
## Table of Contents <!-- omit from toc -->

scoring/performance_profile.py

Lines changed: 12 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,6 @@
2626
the dictionary of submissions.
2727
"""
2828
import itertools
29-
import logging
3029
import operator
3130
import os
3231
import re
@@ -184,10 +183,10 @@ def get_workloads_time_to_target(submission,
184183
if strict:
185184
raise ValueError(
186185
f'Expecting {NUM_BASE_WORKLOADS + NUM_VARIANT_WORKLOADS} workloads '
187-
f'but found {num_workloads} workloads.')
186+
f'but found {num_workloads} workloads for {submission_name}.')
188187
logging.warning(
189188
f'Expecting {NUM_BASE_WORKLOADS + NUM_VARIANT_WORKLOADS} workloads '
190-
f'but found {num_workloads} workloads.')
189+
f'but found {num_workloads} workloads for {submission_name}.')
191190

192191
# For each workload get submission time get the submission times to target.
193192
for workload, group in submission.groupby('workload'):
@@ -198,11 +197,13 @@ def get_workloads_time_to_target(submission,
198197
num_studies = len(group.groupby('study'))
199198
if num_studies != NUM_STUDIES:
200199
if strict:
201-
raise ValueError(f'Expecting {NUM_STUDIES} trials for workload '
202-
f'{workload} but found {num_studies} trials.')
200+
raise ValueError(f'Expecting {NUM_STUDIES} studies for workload '
201+
f'{workload} but found {num_studies} studies '
202+
f'for {submission_name}.')
203203
else:
204-
logging.warning(f'Expecting {NUM_STUDIES} trials for workload '
205-
f'{workload} but found {num_studies} trials.')
204+
logging.warning(f'Expecting {NUM_STUDIES} studies for workload '
205+
f'{workload} but found {num_studies} studies '
206+
f'for {submission_name}.')
206207

207208
# For each study check trials
208209
for study, group in group.groupby('study'):
@@ -213,11 +214,13 @@ def get_workloads_time_to_target(submission,
213214
if strict:
214215
raise ValueError(
215216
f'In Study {study}: Expecting {NUM_TRIALS} trials for workload '
216-
f'{workload} but found {num_trials} trials.')
217+
f'{workload} but found {num_trials} trials '
218+
f'for {submission_name}.')
217219
else:
218220
logging.warning(
219221
f'In Study {study}: Expecting {NUM_TRIALS} trials for workload '
220-
f'{workload} but found {num_trials} trials.')
222+
f'{workload} but found {num_trials} trials '
223+
f'for {submission_name}.')
221224

222225
# Get trial and time index that reaches target
223226
trial_idx, time_idx = get_best_trial_index(
@@ -309,7 +312,6 @@ def compute_performance_profiles(submissions,
309312
df[df.apply(lambda x: x > 4 * best_scores, axis=1)] = np.inf
310313

311314
# For each held-out workload if variant target was not hit set submission to inf
312-
framework = None
313315
for workload in df.keys():
314316
if workload not in BASE_WORKLOADS:
315317
# If variants do not have finite score set base_workload score to inf

scoring/score_submissions.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,6 @@
1212
--compute_performance_profiles
1313
"""
1414

15-
import json
1615
import operator
1716
import os
1817
import pickle
@@ -136,7 +135,7 @@ def get_submission_summary(df, include_test_split=True):
136135
return df
137136

138137

139-
def compute_leaderboard_score(df, normalize=False):
138+
def compute_leaderboard_score(df, normalize=True):
140139
"""Compute leaderboard score by taking integral of performance profile.
141140
142141
Args:

0 commit comments

Comments
 (0)