feat: implement and test accept string/language checks; accept_same_language may need some adjustment after minimization is done

HongleiGu · HongleiGu · commit df12009f4a0c · 2026-01-13T22:35:15.000Z
diff --git a/evaluation_function/schemas/validation.py b/evaluation_function/schemas/validation.py
diff --git a/evaluation_function/validation/validation.py b/evaluation_function/validation/validation.py
@@ -0,0 +1,111 @@
+from itertools import product
+from typing import Set
+from ..schemas.fsa import FSA
+
+def is_valid_fsa(fsa: FSA) -> bool:
+    """Return True when every reference in *fsa* is declared.
+
+    The initial state, the accept states and both ends of each transition
+    must be in ``fsa.states``; each transition symbol in ``fsa.alphabet``.
+    """
+    known_states = set(fsa.states)
+    known_symbols = set(fsa.alphabet)
+
+    if fsa.initial_state not in known_states:
+        return False
+    if any(q not in known_states for q in fsa.accept_states):
+        return False
+    return all(
+        t.from_state in known_states
+        and t.to_state in known_states
+        and t.symbol in known_symbols
+        for t in fsa.transitions
+    )
+
+def is_deterministic(fsa: FSA) -> bool:
+    """Return True if *fsa* is valid and no (state, symbol) pair repeats.
+
+    Two transitions leaving one state on the same symbol are rejected,
+    even when both lead to the same target state.
+    """
+    if not is_valid_fsa(fsa):
+        return False
+
+    # A repeated (source, symbol) pair collapses in the set, so the sizes
+    # differ exactly when some pair labels more than one transition.
+    pairs = [(t.from_state, t.symbol) for t in fsa.transitions]
+    return len(pairs) == len(set(pairs))
+
+def is_complete(fsa: FSA) -> bool:
+    """Return True if *fsa* is deterministic and its transitions are total.
+
+    Total means every state in ``fsa.states`` has an outgoing transition
+    for every symbol in ``fsa.alphabet``.
+    """
+    if not is_deterministic(fsa):
+        return False
+
+    defined = {(t.from_state, t.symbol) for t in fsa.transitions}
+    # Every (state, symbol) combination must appear among the defined pairs.
+    return all(
+        pair in defined
+        for pair in product(set(fsa.states), set(fsa.alphabet))
+    )
+
+def classify_fsa(fsa: FSA) -> dict:
+    """Report the validity, determinism and completeness of *fsa* as booleans."""
+    valid = is_valid_fsa(fsa)
+    deterministic = is_deterministic(fsa)
+    complete = is_complete(fsa)
+    return {"valid": valid, "deterministic": deterministic, "complete": complete}
+
+# NFA-style simulation: track the set of states reachable after each symbol.
+def accepts_string(fsa: FSA, string: str) -> bool:
+    """Return True if *fsa* accepts *string*.
+
+    Each character of *string* is treated as one input symbol. The run
+    starts in ``fsa.initial_state`` and follows every matching transition.
+    """
+    frontier: Set[str] = {fsa.initial_state}
+
+    for ch in string:
+        frontier = {
+            edge.to_state
+            for edge in fsa.transitions
+            if edge.symbol == ch and edge.from_state in frontier
+        }
+        if not frontier:
+            return False  # every run is stuck; no later symbol can recover
+
+    return not frontier.isdisjoint(fsa.accept_states)
+
+
+def fsas_accept_same_string(fsa1: FSA, fsa2: FSA, string: str) -> bool:
+    """Return True if both FSAs give the same verdict on *string*."""
+    # Compare verdicts with ==, not `and`: two automata that both reject the
+    # string agree on it just as much as two that both accept it.
+    return accepts_string(fsa1, string) == accepts_string(fsa2, string)
+
+def fsas_accept_same_language(fsa1: FSA, fsa2: FSA, max_length: int = 5) -> bool:
+    """Bounded check that two FSAs accept the same language.
+
+    Compares both verdicts on every string of length 0..``max_length`` over
+    the shared alphabet; different alphabets count as different languages.
+    True means no counterexample within the bound, not a proof of equality.
+    The number of strings tried grows as ``len(alphabet) ** max_length``.
+    """
+    if set(fsa1.alphabet) != set(fsa2.alphabet):
+        return False
+    symbols = fsa1.alphabet
+    return all(
+        accepts_string(fsa1, word) == accepts_string(fsa2, word)
+        for size in range(max_length + 1)
+        for word in map("".join, product(symbols, repeat=size))
+    )
+# Note: the bounded check above is only practical for small alphabets and short strings.
+# An exact answer needs a DFA equivalence test (e.g. comparing minimized DFAs).
+
+# TODO: is_nfa()
+# TODO: make_complete()
+# TODO: add_sink_state()
+
diff --git a/tests/validation/test_fsa_validation.py b/tests/validation/test_fsa_validation.py
@@ -1,10 +1,6 @@
 import unittest
 
-from evaluation_function.schemas.validation import (
-    is_valid_fsa,
-    is_deterministic,
-    is_complete,
-)
+from evaluation_function.validation.validation import *
 
 from evaluation_function.schemas.fsa import FSA, Transition
 from .utils import make_fsa
@@ -115,6 +111,52 @@ def test_single_state_complete_fsa(self):
         )
 
         self.assertTrue(is_complete(fsa))
+    
+    def test_accepts_string(self):
+        """q0 --a--> q1 with q1 accepting: only the string "a" is accepted."""
+        fsa = make_fsa(
+            states=["q0", "q1"],
+            alphabet=["a"],
+            transitions=[{"from_state": "q0", "to_state": "q1", "symbol": "a"}],
+            initial="q0",
+            accept=["q1"],
+        )
+        self.assertTrue(accepts_string(fsa, "a"))
+        self.assertFalse(accepts_string(fsa, ""))  # the start state is not accepting
+        self.assertFalse(accepts_string(fsa, "aa"))  # no transition leaves q1
+    
+    def test_fsas_accept_same_language(self):
+        """State names do not matter for equivalence; the accept set does."""
+        fsa1 = make_fsa(
+            states=["q0", "q1"],
+            alphabet=["a"],
+            transitions=[{"from_state": "q0", "to_state": "q1", "symbol": "a"}],
+            initial="q0",
+            accept=["q1"],
+        )
+
+        fsa2 = make_fsa(
+            states=["s0", "s1"],
+            alphabet=["a"],
+            transitions=[{"from_state": "s0", "to_state": "s1", "symbol": "a"}],
+            initial="s0",
+            accept=["s1"],
+        )
+
+        fsa3 = make_fsa(
+            states=["q0", "q1"],
+            alphabet=["a"],
+            transitions=[{"from_state": "q0", "to_state": "q1", "symbol": "a"}],
+            initial="q0",
+            accept=["q0"],  # different accept state
+        )
+
+        # fsa1 and fsa2 differ only in state names, so they are equivalent
+        self.assertTrue(fsas_accept_same_language(fsa1, fsa2, max_length=1))
+        # fsa3 accepts "" (q0 is accepting) and rejects "a"; fsa1 does the opposite
+        self.assertFalse(fsas_accept_same_language(fsa1, fsa3, max_length=1))
+
+
 
 
 if __name__ == "__main__":