2
2
"""Classes and methods for parsing regexes into NFAs."""
3
3
4
4
from collections import deque
5
- from itertools import chain , count , product , zip_longest
5
+ from itertools import chain , count , product , repeat , zip_longest
6
6
7
7
from automata .base .utils import get_renaming_function
8
8
from automata .regex .lexer import Lexer
17
17
class NFARegexBuilder:
    """Builder class designed for speed in parsing regular expressions into NFAs."""

    # _state_name_counter is a per-builder iterator (shared via the lexer that
    # created the tokens) rather than a class-level itertools.count, so that
    # independent parses do not interfere with each other's state numbering.
    __slots__ = (
        '_transitions',
        '_initial_state',
        '_final_states',
        '_state_name_counter',
    )

    def __init__(self, *, transitions, initial_state, final_states, counter):
        """
        Initialize new builder class.

        Args:
            transitions: dict mapping each state name to a dict mapping input
                symbols ('' for epsilon) to sets of end states.
            initial_state: name of the initial state.
            final_states: set of accepting state names.
            counter: shared iterator yielding fresh, unused state names.
        """
        self._transitions = transitions
        self._initial_state = initial_state
        self._final_states = final_states
        self._state_name_counter = counter
31
31
32
32
@classmethod
def from_string_literal(cls, literal, counter):
    """
    Initialize this builder accepting only the given string literal.

    One state is drawn from ``counter`` per character of ``literal``, plus
    one final state; state k moves to state k+1 on the k-th character.

    Args:
        literal: the string the resulting NFA must accept exactly.
        counter: shared iterator yielding fresh state names; assumed to
            yield consecutive integers (the +1 arithmetic below relies on
            this).
    """
    # One state per character, each transitioning on that character.
    transitions = {
        next(counter): {symbol: set()}
        for symbol in literal
    }

    # Link each state to its successor; consecutive names come from counter.
    for start_state, path in transitions.items():
        for end_states in path.values():
            end_states.add(start_state + 1)

    # The state reached after the last character is the sole final state.
    final_state = next(counter)
    transitions[final_state] = {}

    return cls(
        transitions=transitions,
        initial_state=min(transitions.keys()),
        final_states={final_state},
        counter=counter
    )
55
56
56
57
@classmethod
def wildcard(cls, input_symbols, counter):
    """
    Initialize this builder for a wildcard with the given input symbols.

    The NFA has two states: the initial state moves to the final state on
    every symbol in ``input_symbols``.

    Args:
        input_symbols: iterable of symbols the wildcard matches.
        counter: shared iterator yielding fresh state names.
    """
    initial_state = next(counter)
    final_state = next(counter)

    transitions = {
        initial_state: {symbol: {final_state} for symbol in input_symbols},
        final_state: {}
    }

    return cls(
        transitions=transitions,
        initial_state=initial_state,
        final_states={final_state},
        counter=counter
    )
75
77
76
78
def union (self , other ):
@@ -79,7 +81,7 @@ def union(self, other):
79
81
"""
80
82
self ._transitions .update (other ._transitions )
81
83
82
- new_initial_state = self .__get_next_state_name ( )
84
+ new_initial_state = next ( self ._state_name_counter )
83
85
84
86
# Add epsilon transitions from new start state to old ones
85
87
self ._transitions [new_initial_state ] = {
@@ -129,9 +131,9 @@ def intersection(self, other):
129
131
if epsilon_transitions_a is not None :
130
132
state_dict = new_transitions .setdefault (curr_state_name , {})
131
133
state_dict .setdefault ('' , set ()).update (
132
- map (get_state_name , product (epsilon_transitions_a , [ q_b ] ))
134
+ map (get_state_name , zip (epsilon_transitions_a , repeat ( q_b ) ))
133
135
)
134
- next_states_iterables .append (product (epsilon_transitions_a , [ q_b ] ))
136
+ next_states_iterables .append (zip (epsilon_transitions_a , repeat ( q_b ) ))
135
137
136
138
# Get transition dict for states in other
137
139
transitions_b = other ._transitions .get (q_b , {})
@@ -140,9 +142,9 @@ def intersection(self, other):
140
142
if epsilon_transitions_b is not None :
141
143
state_dict = new_transitions .setdefault (curr_state_name , {})
142
144
state_dict .setdefault ('' , set ()).update (
143
- map (get_state_name , product ([ q_a ] , epsilon_transitions_b ))
145
+ map (get_state_name , zip ( repeat ( q_a ) , epsilon_transitions_b ))
144
146
)
145
- next_states_iterables .append (product ([ q_a ] , epsilon_transitions_b ))
147
+ next_states_iterables .append (zip ( repeat ( q_a ) , epsilon_transitions_b ))
146
148
147
149
# Add all transitions moving over same input symbols
148
150
for symbol in new_input_symbols :
@@ -190,7 +192,7 @@ def kleene_plus(self):
190
192
"""
191
193
Apply the kleene plus operation to the NFA represented by this builder
192
194
"""
193
- new_initial_state = self .__get_next_state_name ( )
195
+ new_initial_state = next ( self ._state_name_counter )
194
196
195
197
self ._transitions [new_initial_state ] = {
196
198
'' : {self ._initial_state }
@@ -205,7 +207,7 @@ def option(self):
205
207
"""
206
208
Apply the option operation to the NFA represented by this builder
207
209
"""
208
- new_initial_state = self .__get_next_state_name ( )
210
+ new_initial_state = next ( self ._state_name_counter )
209
211
210
212
self ._transitions [new_initial_state ] = {
211
213
'' : {self ._initial_state }
@@ -232,21 +234,17 @@ def shuffle_product(self, other):
232
234
233
235
for symbol , end_states in transitions_a .items ():
234
236
state_dict .setdefault (symbol , set ()).update (
235
- map (get_state_name , product (end_states , [ q_b ] ))
237
+ map (get_state_name , zip (end_states , repeat ( q_b ) ))
236
238
)
237
239
238
240
for symbol , end_states in transitions_b .items ():
239
241
state_dict .setdefault (symbol , set ()).update (
240
- map (get_state_name , product ([ q_a ] , end_states ))
242
+ map (get_state_name , zip ( repeat ( q_a ) , end_states ))
241
243
)
242
244
243
245
self ._final_states = set (map (get_state_name , product (self ._final_states , other ._final_states )))
244
246
self ._transitions = new_transitions
245
247
246
- @classmethod
247
- def __get_next_state_name (cls ):
248
- return next (cls ._state_name_counter )
249
-
250
248
251
249
class UnionToken (InfixOperator ):
252
250
"""Subclass of infix operator defining the union operator."""
@@ -328,19 +326,24 @@ def op(self, left, right):
328
326
class StringToken(Literal):
    """Subclass of literal token defining a string literal."""

    def __init__(self, text, counter):
        """
        Initialize token with its matched text and the shared state-name
        counter used when building its NFA.
        """
        super().__init__(text)
        self.counter = counter

    def val(self):
        """Return an NFARegexBuilder accepting exactly this token's text."""
        return NFARegexBuilder.from_string_literal(self.text, self.counter)
335
334
336
335
337
class WildcardToken(Literal):
    """Subclass of literal token defining a wildcard literal."""

    def __init__(self, text, input_symbols, counter):
        """
        Initialize token with its matched text, the alphabet the wildcard
        ranges over, and the shared state-name counter used when building
        its NFA.
        """
        super().__init__(text)
        self.input_symbols = input_symbols
        self.counter = counter

    def val(self):
        """Return an NFARegexBuilder matching any single input symbol."""
        return NFARegexBuilder.wildcard(self.input_symbols, self.counter)
347
345
348
346
349
def add_concat_tokens (token_list ):
@@ -372,17 +375,18 @@ def add_concat_tokens(token_list):
372
375
def get_regex_lexer(input_symbols):
    """Get lexer for parsing regular expressions.

    Args:
        input_symbols: alphabet used when expanding wildcard ('.') tokens.

    Returns:
        A Lexer with one registered token per regex construct.
    """
    lexer = Lexer()
    # One counter per lexer: every token factory below closes over it, so
    # all NFAs built during a single parse draw globally unique state names.
    state_name_counter = count(0)

    lexer.register_token(LeftParen, r'\(')
    lexer.register_token(RightParen, r'\)')
    lexer.register_token(lambda text: StringToken(text, state_name_counter), r'[A-Za-z0-9]')
    lexer.register_token(UnionToken, r'\|')
    lexer.register_token(IntersectionToken, r'\&')
    lexer.register_token(ShuffleToken, r'\^')
    lexer.register_token(KleeneStarToken, r'\*')
    lexer.register_token(KleenePlusToken, r'\+')
    lexer.register_token(OptionToken, r'\?')
    lexer.register_token(lambda text: WildcardToken(text, input_symbols, state_name_counter), r'\.')

    return lexer
388
392
@@ -391,7 +395,7 @@ def parse_regex(regexstr, input_symbols):
391
395
"""Return an NFARegexBuilder corresponding to regexstr."""
392
396
393
397
if len (regexstr ) == 0 :
394
- return NFARegexBuilder .from_string_literal (regexstr )
398
+ return NFARegexBuilder .from_string_literal (regexstr , count ( 0 ) )
395
399
396
400
lexer = get_regex_lexer (input_symbols )
397
401
lexed_tokens = lexer .lex (regexstr )
0 commit comments