@@ -41,7 +41,7 @@ def __init__(self, task, submission_result):
         self.task = task
         self.submission_result = submission_result
         self.dataset = submission_result.dataset if submission_result else None
-        self.skip_enabled = getattr(task, 'skip_failed_subtask', True)
+        self.skip_enabled = getattr(task, "skip_failed_subtask", False)
         self._subtask_groups = None
         self._failed_subtasks = set()
         self._skipped_testcases = set()
@@ -56,16 +56,35 @@ def should_skip_testcase(self, testcase_codename: str) -> bool:
         if not self.skip_enabled or not self.dataset:
             return False
 
-        # Only skip for GroupMin and GroupMul score types
         score_type = self.dataset.score_type
-        if score_type not in ['GroupMin', 'GroupMul']:
+        if score_type not in ["GroupMin", "GroupMul"]:
             return False
 
+        if testcase_codename in self._skipped_testcases:
+            return True
+
+        # Check if any earlier testcase in the same subtask has failed
         subtask_idx = self._get_subtask_for_testcase(testcase_codename)
         if subtask_idx is None:
             return False
 
-        return subtask_idx in self._failed_subtasks
+        # Check if this subtask has already failed due to an earlier testcase
+        if subtask_idx in self._failed_subtasks:
+            subtask_testcases = self._get_testcases_in_subtask(subtask_idx)
+            try:
+                current_testcase_idx = subtask_testcases.index(testcase_codename)
+                # Check if any earlier testcase in this subtask has failed
+                for i in range(current_testcase_idx):
+                    earlier_testcase = subtask_testcases[i]
+                    if self._is_testcase_failed(earlier_testcase):
+                        logger.info(
+                            f"Skipping testcase {testcase_codename} because earlier testcase {earlier_testcase} failed in subtask {subtask_idx}"
+                        )
+                        return True
+            except ValueError:
+                pass
+
+        return False
 
     def mark_testcase_failed(self, testcase_codename: str, outcome: float):
         """Mark a testcase as failed and potentially skip remaining testcases in the subtask.
@@ -76,31 +95,52 @@ def mark_testcase_failed(self, testcase_codename: str, outcome: float):
         if not self.skip_enabled or not self.dataset:
             return
 
-        # Only handle for GroupMin and GroupMul score types
         score_type = self.dataset.score_type
         if score_type not in ['GroupMin', 'GroupMul']:
             return
 
-        # Check if this testcase failed (outcome is 0.0 for failed)
+        # Check if this testcase failed
        if outcome > 0.0:
             return
 
         subtask_idx = self._get_subtask_for_testcase(testcase_codename)
         if subtask_idx is None:
+            logger.warning(f"Could not find subtask for testcase {testcase_codename}")
             return
 
         # Mark this subtask as failed
         self._failed_subtasks.add(subtask_idx)
         logger.info(f"Marking subtask {subtask_idx} as failed due to testcase {testcase_codename}")
 
-        # Get all testcases in this subtask and mark remaining ones as skipped
+        # Get all testcases in this subtask in order
         subtask_testcases = self._get_testcases_in_subtask(subtask_idx)
-        for tc_codename in subtask_testcases:
-            if tc_codename != testcase_codename:  # Skip the failing testcase itself
-                # Check if this testcase hasn't been evaluated yet
-                if not self._is_testcase_evaluated(tc_codename):
-                    self._skipped_testcases.add(tc_codename)
-                    logger.info(f"Marking testcase {tc_codename} as skipped in subtask {subtask_idx}")
+        logger.info(f"Subtask {subtask_idx} testcases in order: {subtask_testcases}")
+
+        # Find the position of the failing testcase
+        try:
+            failing_testcase_idx = subtask_testcases.index(testcase_codename)
+            logger.info(
+                f"Failing testcase {testcase_codename} is at position {failing_testcase_idx} in subtask {subtask_idx}"
+            )
+        except ValueError:
+            logger.warning(
+                f"Failed testcase {testcase_codename} not found in subtask {subtask_idx}"
+            )
+            return
+
+        # Skip only the testcases that come after the failing one in this subtask
+        for i in range(failing_testcase_idx + 1, len(subtask_testcases)):
+            tc_codename = subtask_testcases[i]
+            # Only skip if this testcase hasn't been started yet
+            if not self._is_testcase_started(tc_codename):
+                self._skipped_testcases.add(tc_codename)
+                logger.info(
+                    f"Marking testcase {tc_codename} (position {i}) as skipped in subtask {subtask_idx} (after failure of {testcase_codename})"
+                )
+            else:
+                logger.info(
+                    f"Testcase {tc_codename} (position {i}) already started/completed, not skipping"
+                )
 
     def get_skipped_testcases(self) -> Set[str]:
         """Get the set of testcase codenames that should be skipped."""
@@ -126,22 +166,31 @@ def _get_subtask_groups(self) -> Optional[Dict[int, List[str]]]:
 
         self._subtask_groups = {}
         testcase_names = sorted(self.dataset.testcases.keys())
+        logger.debug(f"All testcase names in order: {testcase_names}")
+        logger.debug(f"Score type parameters: {parameters}")
 
         for subtask_idx, parameter in enumerate(parameters):
             if len(parameter) < 2:
                 continue
 
-            max_score, target = parameter[0], parameter[1]
+            _, target = (
+                parameter[0],
+                parameter[1],
+            )
 
             if isinstance(target, int):
-                # Number-based grouping: first N testcases
                 start_idx = sum(param[1] for param in parameters[:subtask_idx] if isinstance(param[1], int))
                 end_idx = start_idx + target
                 group_testcases = testcase_names[start_idx:end_idx]
+                logger.debug(
+                    f"Subtask {subtask_idx} (number-based): testcases {start_idx}-{end_idx - 1} = {group_testcases}"
+                )
             elif isinstance(target, str):
-                # Regex-based grouping
                 pattern = re.compile(target)
                 group_testcases = [tc for tc in testcase_names if pattern.match(tc)]
+                logger.debug(
+                    f"Subtask {subtask_idx} (regex-based): pattern '{target}' = {group_testcases}"
+                )
             else:
                 continue
 
@@ -198,3 +247,52 @@ def _is_testcase_evaluated(self, testcase_codename: str) -> bool:
                 return True
 
         return False
+
+    def _is_testcase_started(self, testcase_codename: str) -> bool:
+        """Check if a testcase has been started (queued, running, or completed).
+
+        This is more comprehensive than _is_testcase_evaluated as it also
+        checks if the testcase is currently being evaluated.
+
+        testcase_codename: The codename of the testcase
+
+        Returns: True if the testcase has been started, False otherwise
+        """
+        # First check if it's already completed
+        if self._is_testcase_evaluated(testcase_codename):
+            return True
+
+        # For now, we use the same logic as _is_testcase_evaluated.
+        # In the future we could also check whether the testcase is
+        # currently in the evaluation queue or being processed, but since
+        # we don't have easy access to the queue state here, we only skip
+        # testcases that definitely haven't been touched yet.
+
+        # TODO: Could be enhanced to check the evaluation service queue
+        return self._is_testcase_evaluated(testcase_codename)
+
+    def _is_testcase_failed(self, testcase_codename: str) -> bool:
+        """Check if a testcase has failed (outcome <= 0.0).
+
+        testcase_codename: The codename of the testcase
+
+        Returns: True if the testcase failed, False otherwise
+        """
+        if not self.submission_result:
+            return False
+
+        for evaluation in self.submission_result.evaluations:
+            if evaluation.codename == testcase_codename:
+                try:
+                    outcome = (
+                        float(evaluation.outcome)
+                        if evaluation.outcome != "N/A"
+                        and evaluation.outcome is not None
+                        else 0.0
+                    )
+                    return outcome <= 0.0
+                except (ValueError, TypeError):
+                    return True  # If we can't parse the outcome, consider it failed
+
+        return False  # Not evaluated yet, so not failed
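
A minimal, self-contained sketch of the grouping rule these hunks rely on, assuming GroupMin/GroupMul parameters of the form `[max_score, target]`, where an integer target takes the next N testcases in sorted codename order and a string target is a regex over codenames. The concrete `parameters` and codenames below are made up for illustration, not taken from this PR:

```python
import re

# Hypothetical score-type parameters: one [max_score, target] pair per subtask.
parameters = [[30, 2], [70, r"2_.*"]]
testcase_names = sorted(["1_01", "1_02", "2_01", "2_02", "2_03"])

subtask_groups = {}
for subtask_idx, (max_score, target) in enumerate(parameters):
    if isinstance(target, int):
        # Number-based grouping: skip the testcases consumed by earlier
        # integer-targeted subtasks, then take the next `target` names.
        start_idx = sum(p[1] for p in parameters[:subtask_idx]
                        if isinstance(p[1], int))
        subtask_groups[subtask_idx] = testcase_names[start_idx:start_idx + target]
    elif isinstance(target, str):
        # Regex-based grouping: every codename matching the pattern.
        pattern = re.compile(target)
        subtask_groups[subtask_idx] = [tc for tc in testcase_names
                                       if pattern.match(tc)]

print(subtask_groups)
# {0: ['1_01', '1_02'], 1: ['2_01', '2_02', '2_03']}
```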
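And a sketch of the skip decision itself, assuming (as the diff does) that testcases within a subtask are processed in their listed order and that only testcases strictly after the first failure, and not yet started, get skipped. `testcases_to_skip` and its arguments are placeholder names for illustration, not the helpers from this PR:

```python
def testcases_to_skip(subtask_testcases, failed_codename, started):
    """Return the codenames that should be skipped after a failure.

    subtask_testcases: ordered codenames of one GroupMin/GroupMul subtask
    failed_codename:   the testcase that just scored 0.0
    started:           set of codenames already queued or evaluated
    """
    try:
        failing_idx = subtask_testcases.index(failed_codename)
    except ValueError:
        return set()
    # Only testcases after the failing one, and only if not started yet.
    return {tc for tc in subtask_testcases[failing_idx + 1:]
            if tc not in started}

group = ["2_01", "2_02", "2_03", "2_04"]
print(sorted(testcases_to_skip(group, "2_02", started={"2_01", "2_02"})))
# ['2_03', '2_04']
```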