1*c8dee2aaSAndroid Build Coastguard Worker /* 2*c8dee2aaSAndroid Build Coastguard Worker * Copyright 2017 Google Inc. 3*c8dee2aaSAndroid Build Coastguard Worker * 4*c8dee2aaSAndroid Build Coastguard Worker * Use of this source code is governed by a BSD-style license that can be 5*c8dee2aaSAndroid Build Coastguard Worker * found in the LICENSE file. 6*c8dee2aaSAndroid Build Coastguard Worker */ 7*c8dee2aaSAndroid Build Coastguard Worker 8*c8dee2aaSAndroid Build Coastguard Worker #ifndef SKSL_NFA 9*c8dee2aaSAndroid Build Coastguard Worker #define SKSL_NFA 10*c8dee2aaSAndroid Build Coastguard Worker 11*c8dee2aaSAndroid Build Coastguard Worker #include "src/sksl/lex/NFAState.h" 12*c8dee2aaSAndroid Build Coastguard Worker #include "src/sksl/lex/RegexNode.h" 13*c8dee2aaSAndroid Build Coastguard Worker 14*c8dee2aaSAndroid Build Coastguard Worker #include <string> 15*c8dee2aaSAndroid Build Coastguard Worker #include <utility> 16*c8dee2aaSAndroid Build Coastguard Worker #include <vector> 17*c8dee2aaSAndroid Build Coastguard Worker 18*c8dee2aaSAndroid Build Coastguard Worker /** 19*c8dee2aaSAndroid Build Coastguard Worker * A nondeterministic finite automaton for matching regular expressions. The NFA is initialized with 20*c8dee2aaSAndroid Build Coastguard Worker * a number of regular expressions, and then matches a string against all of them simultaneously. 21*c8dee2aaSAndroid Build Coastguard Worker */ 22*c8dee2aaSAndroid Build Coastguard Worker struct NFA { 23*c8dee2aaSAndroid Build Coastguard Worker /** 24*c8dee2aaSAndroid Build Coastguard Worker * Adds a new regular expression to the set of expressions matched by this automaton, returning 25*c8dee2aaSAndroid Build Coastguard Worker * its index. 26*c8dee2aaSAndroid Build Coastguard Worker */ addRegexNFA27*c8dee2aaSAndroid Build Coastguard Worker int addRegex(const RegexNode& regex) { 28*c8dee2aaSAndroid Build Coastguard Worker std::vector<int> accept; 29*c8dee2aaSAndroid Build Coastguard Worker // we reserve token 0 for END_OF_FILE, so this starts at 1 30*c8dee2aaSAndroid Build Coastguard Worker accept.push_back(this->addState(NFAState(++fRegexCount))); 31*c8dee2aaSAndroid Build Coastguard Worker std::vector<int> startStates = regex.createStates(this, accept); 32*c8dee2aaSAndroid Build Coastguard Worker fStartStates.insert(fStartStates.end(), startStates.begin(), startStates.end()); 33*c8dee2aaSAndroid Build Coastguard Worker return fStartStates.size() - 1; 34*c8dee2aaSAndroid Build Coastguard Worker } 35*c8dee2aaSAndroid Build Coastguard Worker 36*c8dee2aaSAndroid Build Coastguard Worker /** 37*c8dee2aaSAndroid Build Coastguard Worker * Adds a new state to the NFA, returning its index. 38*c8dee2aaSAndroid Build Coastguard Worker */ addStateNFA39*c8dee2aaSAndroid Build Coastguard Worker int addState(NFAState s) { 40*c8dee2aaSAndroid Build Coastguard Worker fStates.push_back(std::move(s)); 41*c8dee2aaSAndroid Build Coastguard Worker return fStates.size() - 1; 42*c8dee2aaSAndroid Build Coastguard Worker } 43*c8dee2aaSAndroid Build Coastguard Worker 44*c8dee2aaSAndroid Build Coastguard Worker /** 45*c8dee2aaSAndroid Build Coastguard Worker * Matches a string against all of the regexes added to this NFA. Returns the index of the first 46*c8dee2aaSAndroid Build Coastguard Worker * (in addRegex order) matching expression, or -1 if no match. This is relatively slow and used 47*c8dee2aaSAndroid Build Coastguard Worker * only for debugging purposes; the NFA should be converted to a DFA before actual use. 48*c8dee2aaSAndroid Build Coastguard Worker */ 49*c8dee2aaSAndroid Build Coastguard Worker int match(std::string s) const; 50*c8dee2aaSAndroid Build Coastguard Worker 51*c8dee2aaSAndroid Build Coastguard Worker int fRegexCount = 0; 52*c8dee2aaSAndroid Build Coastguard Worker 53*c8dee2aaSAndroid Build Coastguard Worker std::vector<NFAState> fStates; 54*c8dee2aaSAndroid Build Coastguard Worker 55*c8dee2aaSAndroid Build Coastguard Worker std::vector<int> fStartStates; 56*c8dee2aaSAndroid Build Coastguard Worker }; 57*c8dee2aaSAndroid Build Coastguard Worker 58*c8dee2aaSAndroid Build Coastguard Worker #endif 59