Fixed some issues with input symbols and inequalities in criteria

KarlLundengaard · KarlLundengaard · commit b2d788254a44 · 2025-06-03T16:44:40.000+01:00
- Made criteria keywords protected from input symbol aliasing
- Added extra outcome when order or equality comparison generates an error (e.g. when checking if a &gt; b where a and b are functions of x and a &gt; b for some values of x but not for others).
diff --git a/app/context/symbolic.py b/app/context/symbolic.py
@@ -90,7 +90,10 @@ def do_comparison(comparison_symbol, expression):
         "<=": lambda expr: bool(expression.cancel().simplify().simplify() <= 0),
     }
     comparison = comparisons[comparison_symbol.strip()]
-    result = comparison(expression)
+    try:
+        result = comparison(expression)
+    except Exception:
+        result = None
     return result
 
 
@@ -218,10 +221,14 @@ def mathematical_equivalence(unused_input):
             return {
                 label+"_TRUE": None
             }
-        else:
+        elif result is False:
             return {
                 label+"_FALSE": None
             }
+        else:
+            return {
+                label+"_UNKNOWN": None
+            }
 
     def set_equivalence(unused_input):
         matches = {"responses": [False]*len(response_list), "answers": [False]*len(answer_list)}
@@ -718,14 +725,19 @@ def criterion_eval_node(criterion, parameters_dict, generate_feedback=True):
     def evaluation_node_internal(unused_input):
         result = check_criterion(criterion, parameters_dict, generate_feedback)
         label = criterion.content_string()
-        if result:
+        if result is True:
             return {
                 label+"_TRUE": feedback_string_generator_inputs
             }
-        else:
+        elif result is False:
             return {
                 label+"_FALSE": feedback_string_generator_inputs
             }
+        else:
+            return {
+                label+"_UNKNOWN": feedback_string_generator_inputs
+            }
+
     label = criterion.content_string()
     graph = CriteriaGraph(label)
     END = CriteriaGraph.END
@@ -747,6 +759,14 @@ def evaluation_node_internal(unused_input):
         feedback_string_generator=symbolic_feedback_string_generators["GENERIC"]("FALSE")
     )
     graph.attach(label+"_FALSE", END.label)
+    graph.attach(
+        label,
+        label+"_UNKNOWN",
+        summary="True",
+        details=label+" is false.",
+        feedback_string_generator=symbolic_feedback_string_generators["GENERIC"]("FALSE")
+    )
+    graph.attach(label+"_UNKNOWN", END.label)
     return graph
 
 
diff --git a/app/docs/user.md b/app/docs/user.md
@@ -37,6 +37,20 @@ The `criteria` parameter reserves `response` and `answer` as keywords that will
 
 **Note:** The `criteria` parameters functionality is currently under development and will rarely produce appropriate feedback and can be quite difficult to debug.
 
+### Available criteria
+
+**Note:** In the table below EXPRESSION is used to denote some mathematical expression, i.e. a string that contains mathematical symbols and operators, but no equal signs `=` or inequality signs `>`, '<'.
+
+| Name  | Syntax                         | Description                         | Example             |
+|-------|:-------------------------------|:------------------------------------|:--------------------|
+| EQUAL | `EXPRESSION = EXPRESSION`      | Checks if the expressions are equal | `answer = response` - Default way to check equality of expressions |
+| ORDER | `EXPRESSION ORDER EXPRESSION`  | Checks if the expressions have the given order. ORDER operators can be `>`, `<`, `>=`, `<=` | `answer > response` - Checks if the answer is greater than the response |
+| WHERE | `EXPRESSION = EXPRESSION where EXPRESSION = EXPRESSION; ... ; EXPRESSION = EXPRESSION` | Checks if the equality on the left side of `where` are equal if the equalities in the comma-separated list on the right side of `where` | `answer = response where x = 0` - Checks if the curves given by the answer and the response intersect when $x=0$. |
+| WRITTEN_AS | `EXPRESSION written as EXPRESSION` | Syntactical comparison, checks if the two expressions are written the same way. | `response written as answer` - Checks if the response is written in the same for as the answer (e.g. if answer is `(x+1)(x+2)` then the response `x^2+3x+2` will not satisfy the criteria but `(x+3)(x+4)` will). |
+| PROPORTIONAL | `EXPRESSION proportional to EXPRESSION` | Checks if one expression can be written is equivalent to the other expression multiplied by some constant. | `answer proportional to response` |
+| CONTAINS | `EXPRESSION contains EXPRESSION` | Checks if the left expression has the right expression as a subexpression. | `response contains x` - Checks if the response contains the symbol x |
+
+
 ## `elementary_functions`
 
 When using implicit multiplication function names with multiple characters are sometimes split and not interpreted properly. Setting `elementary_functions` to true will reserve the function names listed below and prevent them from being split. If a name is said to have one or more alternatives this means that it will accept the alternative names but the reserved name is what will be shown in the preview.
diff --git a/app/evaluation.py b/app/evaluation.py
@@ -55,7 +55,7 @@ def determine_context(parameters):
             input_symbols_reserved_codes.append(input_symbol[0])
             input_symbols_reserved_aliases += [ip for ip in input_symbol[1] if len(ip.strip()) > 0]
 
-    reserved_keywords_codes = {"where", "written as"}
+    reserved_keywords_codes = {"where", "written as", "contains"}
     reserved_keywords_aliases = {"plus_minus", "minus_plus"}
     for re in parameters["reserved_expressions_strings"].values():
         reserved_keywords_aliases = reserved_keywords_aliases.union(set(re.keys()))
@@ -239,12 +239,6 @@ def evaluation_function(response, answer, params, include_test_data=False) -> di
 
     parameters = deepcopy(params)
 
-    # CONSIDER: Can this be moved into the preprocessing procedures in a consistent way?
-    # Can it be turned into its own context? Or moved into the determine_context procedure?
-    # What solution will be most consistently reusable?
-    if parameters.get("is_latex", False):
-        response = parse_latex(response, parameters.get("symbols", {}), False)
-
     reserved_expressions_strings = {
         "learner": {
             "response": response
@@ -269,13 +263,31 @@ def evaluation_function(response, answer, params, include_test_data=False) -> di
     else:
         evaluation_result.latex = preview["latex"]
         evaluation_result.simplified = preview["sympy"]
+
+    reserved_expressions_keys = list(reserved_expressions_strings["learner"].keys())+list(reserved_expressions_strings["task"].keys())
     parameters.update(
         {
             "context": context,
-            "parsing_parameters": context["parsing_parameters_generator"](parameters),
+            "reserved_keywords": context["reserved_keywords"]+reserved_expressions_keys,
+        }
+    )
+    parsing_parameters = context["parsing_parameters_generator"](parameters, unsplittable_symbols=reserved_expressions_keys) 
+    parameters.update(
+        {
+            "parsing_parameters": parsing_parameters,
         }
     )
 
+    # CONSIDER: Can this be moved into the preprocessing procedures in a consistent way?
+    # Can it be turned into its own context? Or moved into the determine_context procedure?
+    # What solution will be most consistently reusable?
+    if parameters.get("is_latex", False):
+        parameters["reserved_expressions_strings"]["learner"].update(
+            {
+                "response": parse_latex(response, parameters.get("symbols", {}), False, parameters=parameters),
+            }
+        )
+
     # FIXME: Move this into expression_utilities
     if params.get("strict_syntax", True):
         if "^" in response:
@@ -287,13 +299,10 @@ def evaluation_function(response, answer, params, include_test_data=False) -> di
     if reserved_expressions_success is False:
         return evaluation_result.serialise(include_test_data)
     reserved_expressions_parsed = {**reserved_expressions["learner"], **reserved_expressions["task"]}
-    parameters.update({"reserved_keywords": parameters["context"]["reserved_keywords"]+list(reserved_expressions_parsed.keys())})
 
     criteria_parser = context["generate_criteria_parser"](reserved_expressions)
     criteria = create_criteria_dict(criteria_parser, parameters)
 
-    parsing_parameters = parameters["context"]["parsing_parameters_generator"](parameters, unsplittable_symbols=list(reserved_expressions_parsed.keys()))
-
     evaluation_parameters = FrozenValuesDictionary(
         {
             "reserved_expressions_strings": reserved_expressions_strings,
diff --git a/app/evaluation_tests.py b/app/evaluation_tests.py
@@ -23,10 +23,10 @@ class TestEvaluationFunction():
     """
 
     # Import tests that makes sure that mathematical expression comparison works as expected
-    from .tests.symbolic_evaluation_tests import TestEvaluationFunction as TestSymbolicComparison
+    #from .tests.symbolic_evaluation_tests import TestEvaluationFunction as TestSymbolicComparison
 
     # Import tests that makes sure that physical quantities are handled as expected
-    from .tests.physical_quantity_evaluation_tests import TestEvaluationFunction as TestQuantities
+    #from .tests.physical_quantity_evaluation_tests import TestEvaluationFunction as TestQuantities
 
     # Import tests that corresponds to examples in documentation and examples module
     from .tests.example_tests import TestEvaluationFunction as TestExamples
@@ -81,4 +81,4 @@ def test_CHEM40002_1_5_instance_2024_25(self):
 
 
 if __name__ == "__main__":
-    pytest.main(['-k not slow', '--tb=line', '--durations=10', os.path.abspath(__file__)])
+    pytest.main(['-xk not slow', '--tb=short', '--durations=10', os.path.abspath(__file__)])
diff --git a/app/tests/example_tests.py b/app/tests/example_tests.py
@@ -507,6 +507,54 @@ def test_syntactical_comparison(self, response, answer, criteria, value, feedbac
         assert result["is_correct"] is value
         assert set(feedback_tags) == set(result["tags"])
 
+    @pytest.mark.parametrize(
+        "response, answer, criteria, value, feedback_tags, additional_params",
+        [
+            (
+                "2*x^2+0.5+0.25*sin(x)^2",
+                "2*x^2",
+                "answer <= response, 2+answer > response",
+                False,
+                [
+                    "answer <= response_TRUE",
+                    "2+answer > response_UNKNOWN",
+                ],
+                {
+                    "symbol_assumptions": "('x', 'real')"
+                }
+            ),
+            (
+                "pi*n",
+                "0",
+                "sin(response)=0, response contains n",
+                True,
+                [
+                    "sin(response)=0_TRUE",
+                    "sin(response)=0_SAME_SYMBOLS_TRUE",
+                    "response contains n_TRUE",
+                ],
+                {
+                    "symbols": {
+                        "n": {
+                            "latex": r"\(n\)",
+                            "aliases": ["i", "k", "N", "I", "K"],
+                        },
+                    },
+                    "symbol_assumptions": "('n', 'integer')"
+                }
+            ),
+        ]
+    )
+    def test_custom_comparison_with_criteria(self, response, answer, criteria, value, feedback_tags, additional_params):
+        params = {
+            "strict_syntax": False,
+            "elementary_functions": True,
+            "criteria": criteria,
+        }
+        params.update(additional_params)
+        result = evaluation_function(response, answer, params, include_test_data=True)
+        assert result["is_correct"] is value
+        assert set(feedback_tags) == set(result["tags"])
 
 if __name__ == "__main__":
     pytest.main(['-sk not slow', "--tb=line", os.path.abspath(__file__)])
diff --git a/app/utility/expression_utilities.py b/app/utility/expression_utilities.py
@@ -616,6 +616,7 @@ def create_sympy_parsing_params(params, unsplittable_symbols=tuple(), symbol_ass
         "rationalise": params.get("rationalise", True),
         "constants": set(),
         "complexNumbers": params["complexNumbers"],
+        "reserved_keywords": params.get("reserved_keywords",[]),
     }
 
     symbol_assumptions = list(symbol_assumptions)

Original file line number	Diff line number	Diff line change
`@@ -616,6 +616,7 @@ def create_sympy_parsing_params(params, unsplittable_symbols=tuple(), symbol_ass`
`616`	`616`	`"rationalise": params.get("rationalise", True),`
`617`	`617`	`"constants": set(),`
`618`	`618`	`"complexNumbers": params["complexNumbers"],`
	`619`	`+ "reserved_keywords": params.get("reserved_keywords",[]),`
`619`	`620`	`}`
`620`	`621`
`621`	`622`	`symbol_assumptions = list(symbol_assumptions)`