Changes to satisfy mypy.

PGijsbers · PGijsbers · commit 0608e7a86c8b · 2019-04-15T17:58:56.000+02:00
diff --git a/openml/runs/run.py b/openml/runs/run.py
@@ -12,7 +12,13 @@
 import openml._api_calls
 from ..exceptions import PyOpenMLError
 from ..flows import get_flow
-from ..tasks import get_task, TaskTypeEnum
+from ..tasks import (get_task,
+                     TaskTypeEnum,
+                     OpenMLClassificationTask,
+                     OpenMLLearningCurveTask,
+                     OpenMLClusteringTask,
+                     OpenMLRegressionTask
+                     )
 
 
 class OpenMLRun(object):
@@ -108,24 +114,24 @@ def from_filesystem(cls, directory: str, expect_model: bool = True) -> 'OpenMLRu
         if not os.path.isfile(model_path) and expect_model:
             raise ValueError('Could not find model.pkl')
 
-        with open(description_path, 'r') as fp:
-            xml_string = fp.read()
+        with open(description_path, 'r') as fht:
+            xml_string = fht.read()
         run = openml.runs.functions._create_run_from_xml(xml_string, from_server=False)
 
         if run.flow_id is None:
             flow = openml.flows.OpenMLFlow.from_filesystem(directory)
             run.flow = flow
             run.flow_name = flow.name
 
-        with open(predictions_path, 'r') as fp:
-            predictions = arff.load(fp)
+        with open(predictions_path, 'r') as fht:
+            predictions = arff.load(fht)
             run.data_content = predictions['data']
 
         if os.path.isfile(model_path):
             # note that it will load the model if the file exists, even if
             # expect_model is False
-            with open(model_path, 'rb') as fp:
-                run.model = pickle.load(fp)
+            with open(model_path, 'rb') as fhb:
+                run.model = pickle.load(fhb)
 
         if os.path.isfile(trace_path):
             run.trace = openml.runs.OpenMLRunTrace._from_filesystem(trace_path)
@@ -208,7 +214,18 @@ def _generate_arff_dict(self) -> 'OrderedDict[str, Any]':
         arff_dict['relation'] =\
             'openml_task_{}_predictions'.format(task.task_id)
 
-        if task.task_type_id == TaskTypeEnum.SUPERVISED_CLASSIFICATION:
+        if isinstance(task, OpenMLLearningCurveTask):
+            class_labels = task.class_labels  # type: ignore
+            arff_dict['attributes'] = [('repeat', 'NUMERIC'),
+                                       ('fold', 'NUMERIC'),
+                                       ('sample', 'NUMERIC'),
+                                       ('row_id', 'NUMERIC')] + \
+                                      [('confidence.' + class_labels[i],
+                                        'NUMERIC') for i in
+                                       range(len(class_labels))] + \
+                                      [('prediction', class_labels),
+                                       ('correct', class_labels)]
+        elif isinstance(task, OpenMLClassificationTask):
             class_labels = task.class_labels
             instance_specifications = [('repeat', 'NUMERIC'),
                                        ('fold', 'NUMERIC'),
@@ -222,27 +239,14 @@ def _generate_arff_dict(self) -> 'OrderedDict[str, Any]':
             arff_dict['attributes'] = (instance_specifications
                                        + prediction_confidences
                                        + prediction_and_true)
-
-        elif task.task_type_id == TaskTypeEnum.LEARNING_CURVE:
-            class_labels = task.class_labels
-            arff_dict['attributes'] = [('repeat', 'NUMERIC'),
-                                       ('fold', 'NUMERIC'),
-                                       ('sample', 'NUMERIC'),
-                                       ('row_id', 'NUMERIC')] + \
-                                      [('confidence.' + class_labels[i],
-                                        'NUMERIC') for i in
-                                       range(len(class_labels))] + \
-                                      [('prediction', class_labels),
-                                       ('correct', class_labels)]
-
-        elif task.task_type_id == TaskTypeEnum.SUPERVISED_REGRESSION:
+        elif isinstance(task, OpenMLRegressionTask):
             arff_dict['attributes'] = [('repeat', 'NUMERIC'),
                                        ('fold', 'NUMERIC'),
                                        ('row_id', 'NUMERIC'),
                                        ('prediction', 'NUMERIC'),
                                        ('truth', 'NUMERIC')]
 
-        elif task.task_type == TaskTypeEnum.CLUSTERING:
+        elif isinstance(task, OpenMLClusteringTask):
             arff_dict['attributes'] = [('repeat', 'NUMERIC'),
                                        ('fold', 'NUMERIC'),
                                        ('row_id', 'NUMERIC'),
diff --git a/openml/runs/trace.py b/openml/runs/trace.py
@@ -32,7 +32,7 @@ def __init__(self, run_id, trace_iterations):
         self.run_id = run_id
         self.trace_iterations = trace_iterations
 
-    def get_selected_iteration(self, fold: int, repeat: int) -> 'OpenMLTraceIteration':
+    def get_selected_iteration(self, fold: int, repeat: int) -> int:
         """
         Returns the trace iteration that was marked as selected. In
         case multiple are marked as selected (should not happen) the
@@ -46,7 +46,7 @@ def get_selected_iteration(self, fold: int, repeat: int) -> 'OpenMLTraceIteratio
 
         Returns
         ----------
-        OpenMLTraceIteration
+        int
             The trace iteration from the given fold and repeat that was
             selected as the best iteration by the search procedure
         """