From 9133ae47ed01d44e9e0160764501e830879ffa51 Mon Sep 17 00:00:00 2001
From: Gunnar Kreitz
Date: Mon, 24 Mar 2025 13:02:26 +0100
Subject: [PATCH 1/5] Add mypy to github workflow

---
 .github/workflows/python-app.yml |  5 ++++-
 mypy.ini                         | 23 +++++++++++++++++++++++
 2 files changed, 27 insertions(+), 1 deletion(-)
 create mode 100644 mypy.ini

diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml
index 45c4851e..79b82285 100644
--- a/.github/workflows/python-app.yml
+++ b/.github/workflows/python-app.yml
@@ -31,7 +31,7 @@ jobs:
     - name: Install dependencies
       run: |
         python -m pip install --upgrade pip
-        pip install flake8 pytest
+        pip install flake8 pytest mypy
         if [ -f requirements.txt ]; then pip install -r requirements.txt; fi
     - name: Lint with flake8
       run: |
@@ -44,3 +44,6 @@ jobs:
       run: make builddeb
     - name: Test with pytest
       run: pytest
+    - name: Run mypy
+      run: |
+        mypy --non-interactive --config-file mypy.ini -p problemtools
diff --git a/mypy.ini b/mypy.ini
new file mode 100644
index 00000000..ff182a3e
--- /dev/null
+++ b/mypy.ini
@@ -0,0 +1,23 @@
+[mypy]
+ignore_missing_imports = True
+install_types = True
+check_untyped_defs = True
+ignore_errors = False
+
+[mypy-problemtools.tests.*]
+ignore_errors = True
+
+[mypy-problemtools.generatedata]
+ignore_errors = True
+
+[mypy-problemtools.languages]
+ignore_errors = True
+
+[mypy-problemtools.template]
+ignore_errors = True
+
+[mypy-problemtools.run.checktestdata]
+ignore_errors = True
+
+[mypy-problemtools.run.viva]
+ignore_errors = True

From 54e187f8e63dcea166a836904f24560b6a254ec6 Mon Sep 17 00:00:00 2001
From: Gunnar Kreitz
Date: Mon, 24 Mar 2025 13:02:53 +0100
Subject: [PATCH 2/5] Change type from list to tuple, helping mypy and being clearer

---
 problemtools/ProblemPlasTeX/__init__.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/problemtools/ProblemPlasTeX/__init__.py b/problemtools/ProblemPlasTeX/__init__.py
index f0a608e7..f7fb3d53 100644
--- a/problemtools/ProblemPlasTeX/__init__.py
+++ b/problemtools/ProblemPlasTeX/__init__.py
@@ -17,8 +17,8 @@ class ImageConverter(object):
     imageUnits = ''
     imageTypes = ['.png', '.jpg', '.jpeg', '.gif'] #, '.svg']
 
-    imageConversion = {'.pdf': ['.png',
-                                ['gs', '-dUseCropBox', '-sDEVICE=pngalpha', '-r300', '-o']]}
+    imageConversion = {'.pdf': ('.png',
+                                ['gs', '-dUseCropBox', '-sDEVICE=pngalpha', '-r300', '-o'])}
 
     def __init__(self, document):
         self.config = document.config

From 948db0f834366b35d4a057c94eb48dc7d7ae60eb Mon Sep 17 00:00:00 2001
From: Gunnar Kreitz
Date: Mon, 24 Mar 2025 13:03:27 +0100
Subject: [PATCH 3/5] Fix name of exception (old one also worked, as parser does import * from Scanner, but felt weird)

---
 problemtools/config.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/problemtools/config.py b/problemtools/config.py
index bcc74896..4032c054 100644
--- a/problemtools/config.py
+++ b/problemtools/config.py
@@ -24,7 +24,7 @@ def load_config(configuration_file):
     try:
         with open(path, 'r') as config:
             new_config = yaml.safe_load(config.read())
-    except (yaml.parser.ParserError, yaml.parser.ScannerError) as err:
+    except (yaml.parser.ParserError, yaml.scanner.ScannerError) as err:
         raise ConfigError('Config file %s: failed to parse: %s' % (path, err))
     if res is None:
         if new_config is None:

From ec4bf5d47741b3d5841b634c0346ecc59f650d4f Mon Sep 17 00:00:00 2001
From: Gunnar Kreitz
Date: Mon, 24 Mar 2025 13:04:21 +0100
Subject: [PATCH 4/5] Add type annotations and abstract class markers

---
 .../ProblemPlasTeX/ProblemsetMacros.py |  2 +-
 problemtools/languages.py              |  4 ++--
 problemtools/run/program.py            |  8 +++++++-
 problemtools/verifyproblem.py          | 18 +++++++++---------
 4 files changed, 19 insertions(+), 13 deletions(-)

diff --git a/problemtools/ProblemPlasTeX/ProblemsetMacros.py b/problemtools/ProblemPlasTeX/ProblemsetMacros.py
index 31794c98..592a1bd1 100644
--- a/problemtools/ProblemPlasTeX/ProblemsetMacros.py
+++ b/problemtools/ProblemPlasTeX/ProblemsetMacros.py
@@ -69,7 +69,7 @@ class sampletableinteractive(Command):
     def read_sample_interaction(self, filename):
        data = io.open(filename, 'r', encoding='utf-8').read()
        messages = []
-       cur_msg = []
+       cur_msg: list[str] = []
        cur_mode = None
        for line in data.split('\n'):
            if not line: continue
diff --git a/problemtools/languages.py b/problemtools/languages.py
index 8c0c72c2..0da66722 100644
--- a/problemtools/languages.py
+++ b/problemtools/languages.py
@@ -186,7 +186,7 @@ def detect_language(self, file_list):
         list of files did not match any language in the set.
         """
         result = None
-        src = []
+        src: list[str] = []
         prio = 1e99
         for lang in self.languages.values():
             lang_src = lang.get_source_files(file_list)
@@ -236,7 +236,7 @@ def update(self, data):
             else:
                 self.languages[lang_id].update(lang_spec)
 
-        priorities = {}
+        priorities: dict[int, Language] = {}
         for (lang_id, lang) in self.languages.items():
             if lang.priority in priorities:
                 raise LanguageConfigError(
diff --git a/problemtools/run/program.py b/problemtools/run/program.py
index 023ff0e3..49cca332 100644
--- a/problemtools/run/program.py
+++ b/problemtools/run/program.py
@@ -9,10 +9,12 @@
 
 from .errors import ProgramError
 
+from abc import ABC, abstractmethod
+
 log = logging.getLogger(__name__)
 
 
-class Program(object):
+class Program(ABC):
     """Abstract base class for programs.
     """
@@ -21,6 +23,10 @@ def __init__(self) -> None:
         self._compile_lock = threading.Lock()
         self._compile_result: tuple[bool, str|None]|None = None
 
+    @abstractmethod
+    def get_runcmd(self, cwd = None, memlim = None) -> list[str]:
+        pass
+
     def run(self, infile='/dev/null', outfile='/dev/null', errfile='/dev/null',
             args=None, timelim=1000, memlim=1024, work_dir=None):
         """Run the program.
diff --git a/problemtools/verifyproblem.py b/problemtools/verifyproblem.py
index cd708c4e..270fcde4 100644
--- a/problemtools/verifyproblem.py
+++ b/problemtools/verifyproblem.py
@@ -33,7 +33,8 @@
 from . import languages
 from . import run
 
-from typing import Any, Callable, Literal, Pattern, Match, ParamSpec, TypeVar
+from abc import ABC
+from typing import Any, Callable, ClassVar, Literal, Pattern, Match, ParamSpec, Type, TypeVar
 
 log = logging.getLogger(__name__)
 
@@ -110,7 +111,7 @@ def wait_for_background_work(self) -> None:
         concurrent.futures.wait(self._background_work)
 
 
-class ProblemAspect:
+class ProblemAspect(ABC):
     max_additional_info = 15
     errors = 0
     warnings = 0
@@ -175,7 +176,7 @@ class ProblemPart(ProblemAspect):
     """Should always be overridden by the subclass. Specifies the name
     that will be used to refer to the part e.g for logs.
     """
-    PART_NAME = None
+    PART_NAME: ClassVar[str]
     """Should return all classes that need to be initialized before
     this one. It is sufficient to be a subclass of the classes listed.
     There should be exactly one subclass of each dependency in the
@@ -710,8 +711,7 @@ def all_datasets(self) -> list:
 
 class ProblemStatement(ProblemPart):
     PART_NAME = 'statement'
-
-    EXTENSIONS = []
+    EXTENSIONS: list[str] = []
 
     def setup(self):
         if not self.EXTENSIONS:
@@ -1727,7 +1727,7 @@ def check(self, context: Context) -> bool:
         return self._check_res
 
 
-PROBLEM_FORMATS = {
+PROBLEM_FORMATS: dict[str, dict[str, list[Type[ProblemPart]]]] = {
     'legacy': {
         'config': [ProblemConfig],
         'statement': [ProblemStatementLegacy, Attachments],
@@ -1753,13 +1753,13 @@ class Problem(ProblemAspect):
     of category -> part-types. You could for example have
     'validators' -> [InputValidators, OutputValidators].
     """
     def __init__(self, probdir: str, parts: dict[str, list[type]] = PROBLEM_FORMATS['legacy']):
-        self.part_mapping: dict[str, list[type]] = parts
+        self.part_mapping: dict[str, list[Type[ProblemPart]]] = parts
         self.aspects: set[type] = {v for s in parts.values() for v in s}
         self.probdir = os.path.realpath(probdir)
         self.shortname: str|None = os.path.basename(self.probdir)
         super().__init__(self.shortname)
         self.language_config = languages.load_language_config()
-        self._data = {}
+        self._data: dict[str, dict] = {}
         self.debug(f'Problem-format: {parts}')
 
     def get(self, part) -> dict:
@@ -1777,7 +1777,7 @@ def __enter__(self) -> Problem:
 
         # Initialize the classes, making sure to resolve dependencies first
         initialized = set()
-        self.classes = {}
+        self.classes: dict[str, ProblemPart] = {}
 
         def init(_class):
             if _class.PART_NAME in initialized:

From a31d215add1b48d57f79f662ce93fc8c92f40153 Mon Sep 17 00:00:00 2001
From: Gunnar Kreitz
Date: Mon, 24 Mar 2025 13:32:14 +0100
Subject: [PATCH 5/5] Add getProblemPart for when we need to access problem.classes

---
 problemtools/tests/test_verify_hello.py |  4 +--
 problemtools/verifyproblem.py           | 40 ++++++++++++++-----------
 2 files changed, 24 insertions(+), 20 deletions(-)

diff --git a/problemtools/tests/test_verify_hello.py b/problemtools/tests/test_verify_hello.py
index 48d38d9d..49ff53aa 100644
--- a/problemtools/tests/test_verify_hello.py
+++ b/problemtools/tests/test_verify_hello.py
@@ -12,5 +12,5 @@ def test_load_hello():
     with verify.Problem(string) as p:
         assert p.shortname == "hello"
         # pytest and fork don't go along very well, so just run aspects that work without run
-        assert p.classes[verify.ProblemConfig.PART_NAME].check(args)
-        assert p.classes[verify.Attachments.PART_NAME].check(args)
+        assert p.getProblemPart(verify.ProblemConfig).check(args)
+        assert p.getProblemPart(verify.Attachments).check(args)
diff --git a/problemtools/verifyproblem.py b/problemtools/verifyproblem.py
index 270fcde4..646e262f 100644
--- a/problemtools/verifyproblem.py
+++ b/problemtools/verifyproblem.py
@@ -220,8 +220,8 @@ def __init__(self, problem: Problem, aspect_name: str, base: str, testcasegroup:
         self._problem = problem
         self.testcasegroup = testcasegroup
         self.reuse_result_from: TestCase|None = None
-        self.counter = len(problem.classes[ProblemTestCases.PART_NAME].testcase_by_infile)
-        problem.classes[ProblemTestCases.PART_NAME].testcase_by_infile[self.infile] = self
+        self.counter = len(problem.getProblemPart(ProblemTestCases).testcase_by_infile)
+        problem.getProblemPart(ProblemTestCases).testcase_by_infile[self.infile] = self
 
     def check_newlines(self, filename: str) -> None:
         with open(filename, 'rb') as f:
@@ -259,7 +259,7 @@ def check(self, context: Context) -> bool:
         self.check_newlines(self.ansfile)
         self.check_size_limits(self.infile)
         self.check_size_limits(self.ansfile)
-        self._problem.classes[InputValidators.PART_NAME].validate(self)
+        self._problem.getProblemPart(InputValidators).validate(self)
         anssize = os.path.getsize(self.ansfile) / 1024.0 / 1024.0
         outputlim = self._problem.get(ProblemConfig)['limits']['output']
         if anssize > outputlim:
@@ -267,7 +267,7 @@ def check(self, context: Context) -> bool:
         elif 2 * anssize > outputlim:
             self.warning(f'Answer file ({anssize:.1f} Mb) is within 50% of output limit ({outputlim} Mb), you might want to increase output limit')
         if not self._problem.get(ProblemTestCases)['is_interactive']:
-            val_res = self._problem.classes[OutputValidators.PART_NAME].validate(self, self.ansfile)
+            val_res = self._problem.getProblemPart(OutputValidators).validate(self, self.ansfile)
             if val_res.verdict != 'AC':
                 if self.is_in_sample_group():
                     self.error(f'judge answer file got {val_res}')
@@ -286,8 +286,8 @@ def set_symlinks(self) -> None:
         if not os.path.islink(self.infile):
             return
         target = os.path.realpath(self.infile)
-        if target in self._problem.classes[ProblemTestCases.PART_NAME].testcase_by_infile:
-            self.reuse_result_from = self._problem.classes[ProblemTestCases.PART_NAME].testcase_by_infile[target]
+        if target in self._problem.getProblemPart(ProblemTestCases).testcase_by_infile:
+            self.reuse_result_from = self._problem.getProblemPart(ProblemTestCases).testcase_by_infile[target]
 
     def _check_symlinks(self) -> bool:
         if not os.path.islink(self.infile):
@@ -324,7 +324,7 @@ def run_submission(self, sub, runner: Runner, context: Context) -> Result:
     def run_submission_real(self, sub, context: Context, timelim: int, timelim_low: int, timelim_high: int) -> Result:
         # This may be called off-main thread.
         if self._problem.get(ProblemTestCases)['is_interactive']:
-            res_high = self._problem.classes[OutputValidators.PART_NAME].validate_interactive(self, sub, timelim_high, self._problem.classes[Submissions.PART_NAME])
+            res_high = self._problem.getProblemPart(OutputValidators).validate_interactive(self, sub, timelim_high, self._problem.getProblemPart(Submissions))
         else:
             outfile = os.path.join(self._problem.tmpdir, f'output-{self.counter}')
             errfile = os.path.join(self._problem.tmpdir, f'error-{self.counter}')
@@ -342,7 +342,7 @@ def run_submission_real(self, sub, context: Context, timelim: int, timelim_low:
                 info = None
                 res_high = SubmissionResult('RTE', additional_info=info)
             else:
-                res_high = self._problem.classes[OutputValidators.PART_NAME].validate(self, outfile)
+                res_high = self._problem.getProblemPart(OutputValidators).validate(self, outfile)
             res_high.runtime = runtime
 
         if res_high.runtime <= timelim_low:
@@ -510,10 +510,10 @@ def check(self, context: Context) -> bool:
 
         if self.config['grading'] not in ['default', 'custom']:
             self.error("Invalid grading policy in testdata.yaml")
 
-        if self.config['grading'] == 'custom' and len(self._problem.classes[Graders.PART_NAME]._graders) == 0:
-            self._problem.classes[Graders.PART_NAME].error(f'{self} has custom grading but no custom graders provided')
+        if self.config['grading'] == 'custom' and len(self._problem.getProblemPart(Graders)._graders) == 0:
+            self._problem.getProblemPart(Graders).error(f'{self} has custom grading but no custom graders provided')
         if self.config['grading'] == 'default' and Graders._default_grader is None:
-            self._problem.classes[Graders.PART_NAME].error(f'{self} has default grading but I could not find default grader')
+            self._problem.getProblemPart(Graders).error(f'{self} has default grading but I could not find default grader')
 
         if self.config['grading'] == 'default' and 'ignore_sample' in self.config['grader_flags'].split():
             if self._parent is not None:
@@ -687,7 +687,7 @@ def aggregate_results(self, sub, sub_results: list[SubmissionResult], shadow_res
             res.additional_info = judge_error.additional_info
             res.testcase = judge_error.testcase
         else:
-            res.verdict, score = self._problem.classes[Graders.PART_NAME].grade(sub_results, self, shadow_result)
+            res.verdict, score = self._problem.getProblemPart(Graders).grade(sub_results, self, shadow_result)
             if sub_results:
                 res.testcase = sub_results[-1].testcase
                 res.additional_info = sub_results[-1].additional_info
@@ -1658,7 +1658,7 @@ def fully_accepted(self, result: SubmissionResult) -> bool:
     def start_background_work(self, context: Context) -> None:
         # Send off an early background compile job for each submission and
         # validator, to avoid a bottleneck step at the start of each test run.
-        self.problem.classes[OutputValidators.PART_NAME].start_background_work(context)
+        self.problem.getProblemPart(OutputValidators).start_background_work(context)
         for acr in self._submissions:
             for sub in self._submissions[acr]:
                 context.submit_background_work(lambda s: s.compile(), sub)
@@ -1744,6 +1744,7 @@ def check(self, context: Context) -> bool:
 
 # parts tested in alphabetical order
 PROBLEM_PARTS = [*sorted({part for format in PROBLEM_FORMATS.values() for part in format})]
+_ProblemPartT = TypeVar("_ProblemPartT", bound=ProblemPart)
 
 class Problem(ProblemAspect):
     """Represents a checkable problem
@@ -1768,6 +1769,9 @@ def get(self, part) -> dict:
         assert part in self._data
         return self._data[part]
 
+    def getProblemPart(self, part: Type[_ProblemPartT]) -> _ProblemPartT:
+        return self._classes[part.PART_NAME]  # type: ignore
+
     def __enter__(self) -> Problem:
         self.tmpdir = tempfile.mkdtemp(prefix=f'verify-{self.shortname}-')
         if not os.path.isdir(self.probdir):
@@ -1777,7 +1781,7 @@ def __enter__(self) -> Problem:
 
         # Initialize the classes, making sure to resolve dependencies first
         initialized = set()
-        self.classes: dict[str, ProblemPart] = {}
+        self._classes: dict[str, ProblemPart] = {}
 
         def init(_class):
             if _class.PART_NAME in initialized:
@@ -1794,8 +1798,8 @@ def init(_class):
                     raise NotImplementedError(f'Part "{_class.PART_NAME}" depends on part "{dependency.PART_NAME}" which showed up {cnt} times in problem-format (should have showed up exactly once)')
             self.debug(f'Initializing {_class.PART_NAME} ({_class})')
             assert _class.PART_NAME not in initialized
-            self.classes[_class.PART_NAME] = _class(self)
-            self._data[_class.PART_NAME] = self.classes[_class.PART_NAME].setup()
+            self._classes[_class.PART_NAME] = _class(self)
+            self._data[_class.PART_NAME] = self._classes[_class.PART_NAME].setup()
             initialized.add(_class.PART_NAME)
 
         for c in self.aspects:
@@ -1835,12 +1839,12 @@ def check(self, args: argparse.Namespace) -> tuple[int, int]:
             if executor:
                 for part in parts:
                     for item in self.part_mapping[part]:
-                        self.classes[item.PART_NAME].start_background_work(context)
+                        self._classes[item.PART_NAME].start_background_work(context)
 
             for part in parts:
                 self.msg(f'Checking {part}')
                 for item in self.part_mapping[part]:
-                    self.classes[item.PART_NAME].check(context)
+                    self._classes[item.PART_NAME].check(context)
         except VerifyError:
             pass
         finally:
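
Reviewer note, illustration only and not part of the patch series: patch 5 replaces string-keyed lookups in problem.classes with the typed accessor getProblemPart, built from a TypeVar bound to ProblemPart. The standalone sketch below uses made-up Part/Config/Registry names to show why that shape lets mypy infer the concrete part type at each call site, which a plain dict[str, ProblemPart] lookup cannot do.

from typing import ClassVar, Type, TypeVar


class Part:
    """Stand-in for ProblemPart: each part type advertises a unique name."""
    PART_NAME: ClassVar[str]


class Config(Part):
    PART_NAME = 'config'

    def check(self) -> bool:
        return True


_PartT = TypeVar('_PartT', bound=Part)


class Registry:
    """Stand-in for Problem: parts are stored under their PART_NAME."""

    def __init__(self) -> None:
        self._parts: dict[str, Part] = {}

    def add(self, part: Part) -> None:
        self._parts[part.PART_NAME] = part

    def get_part(self, part_type: Type[_PartT]) -> _PartT:
        # The dict only promises the base type, so the narrowing is asserted
        # once here; every caller gets the precise subclass type back.
        return self._parts[part_type.PART_NAME]  # type: ignore[return-value]


registry = Registry()
registry.add(Config())
# mypy infers Config here, so .check() is verified to exist;
# registry._parts['config'].check() would be rejected, since Part has no check().
assert registry.get_part(Config).check()

The single type: ignore inside the accessor plays the same role as the one in getProblemPart itself: the narrowing assumption lives in one place instead of at every caller.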
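
A second illustration, also not part of the patches: patch 4 declares Program as an ABC with an abstract get_runcmd. The toy subclasses below are hypothetical; they only demonstrate that a program class which forgets the override now fails at instantiation time (and is flagged by mypy) rather than at the first call.

from abc import ABC, abstractmethod


class Program(ABC):
    """Toy stand-in for problemtools' Program base class."""

    @abstractmethod
    def get_runcmd(self, cwd=None, memlim=None) -> list[str]:
        ...


class EchoProgram(Program):
    def get_runcmd(self, cwd=None, memlim=None) -> list[str]:
        return ['echo', 'hello']


class BrokenProgram(Program):
    # Forgot to implement get_runcmd.
    pass


EchoProgram()  # fine
try:
    BrokenProgram()  # TypeError: abstract method get_runcmd is not implemented
except TypeError as err:
    print(err)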