1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /********************************************************************
4  * COPYRIGHT:
5  * Copyright (c) 2001-2016, International Business Machines Corporation and
6  * others. All Rights Reserved.
7  ********************************************************************/
8 
9 #ifndef RBBINODE_H
10 #define RBBINODE_H
11 
12 #include "unicode/utypes.h"
13 #include "unicode/unistr.h"
14 #include "unicode/uobject.h"
15 
16 //
17 //  class RBBINode
18 //
19 //                    Represents a node in the parse tree generated when reading
20 //                    a rule file.
21 //
22 
23 U_NAMESPACE_BEGIN
24 
25 class    UnicodeSet;
26 class    UVector;
27 
28 class RBBINode : public UMemory {
29     public:
30         enum NodeType {
31             setRef,
32             uset,
33             varRef,
34             leafChar,
35             lookAhead,
36             tag,
37             endMark,
38             opStart,
39             opCat,
40             opOr,
41             opStar,
42             opPlus,
43             opQuestion,
44             opBreak,
45             opReverse,
46             opLParen
47         };
48 
49         enum OpPrecedence {
50             precZero,
51             precStart,
52             precLParen,
53             precOpOr,
54             precOpCat
55         };
56 
57         NodeType      fType;
58         RBBINode      *fParent;
59         RBBINode      *fLeftChild;
60         RBBINode      *fRightChild;
61         UnicodeSet    *fInputSet;           // For uset nodes only.
62         OpPrecedence  fPrecedence;          // For binary ops only.
63 
64         UnicodeString fText;                // Text corresponding to this node.
65                                             //   May be lazily evaluated when (if) needed
66                                             //   for some node types.
67         int           fFirstPos;            // Position in the rule source string of the
68                                             //   first text associated with the node.
69                                             //   If there's a left child, this will be the same
70                                             //   as that child's left pos.
71         int           fLastPos;             //  Last position in the rule source string
72                                             //    of any text associated with this node.
73                                             //    If there's a right child, this will be the same
74                                             //    as that child's last postion.
75 
76         UBool         fNullable;            // See Aho.
77         int32_t       fVal;                 // For leafChar nodes, the value.
78                                             //   Values are the character category,
79                                             //   corresponds to columns in the final
80                                             //   state transition table.
81 
82         UBool         fLookAheadEnd;        // For endMark nodes, set TRUE if
83                                             //   marking the end of a look-ahead rule.
84 
85         UBool         fRuleRoot;            // True if this node is the root of a rule.
86         UBool         fChainIn;             // True if chaining into this rule is allowed
87                                             //     (no '^' present).
88 
89         UVector       *fFirstPosSet;
90         UVector       *fLastPosSet;         // TODO: rename fFirstPos & fLastPos to avoid confusion.
91         UVector       *fFollowPos;
92 
93 
94         RBBINode(NodeType t);
95         RBBINode(const RBBINode &other);
96         ~RBBINode();
97 
98         RBBINode    *cloneTree();
99         RBBINode    *flattenVariables();
100         void         flattenSets();
101         void         findNodes(UVector *dest, RBBINode::NodeType kind, UErrorCode &status);
102 
103 #ifdef RBBI_DEBUG
104         static void printNodeHeader();
105         static void printNode(const RBBINode *n);
106         static void printTree(const RBBINode *n, UBool withHeading);
107 #endif
108 
109     private:
110         RBBINode &operator = (const RBBINode &other); // No defs.
111         UBool operator == (const RBBINode &other);    // Private, so these functions won't accidently be used.
112 
113 #ifdef RBBI_DEBUG
114     public:
115         int           fSerialNum;           //  Debugging aids.
116 #endif
117 };
118 
119 #ifdef RBBI_DEBUG
120 U_CFUNC void
121 RBBI_DEBUG_printUnicodeString(const UnicodeString &s, int minWidth=0);
122 #endif
123 
124 U_NAMESPACE_END
125 
126 #endif
127 
128