// Copyright (C) 2010 Internet Systems Consortium, Inc. ("ISC") // // Permission to use, copy, modify, and/or distribute this software for any // purpose with or without fee is hereby granted, provided that the above // copyright notice and this permission notice appear in all copies. // // THE SOFTWARE IS PROVIDED "AS IS" AND ISC DISCLAIMS ALL WARRANTIES WITH // REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY // AND FITNESS. IN NO EVENT SHALL ISC BE LIABLE FOR ANY SPECIAL, DIRECT, // INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM // LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE // OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR // PERFORMANCE OF THIS SOFTWARE. #ifndef _RBTREE_H #define _RBTREE_H 1 //! \file datasrc/rbtree.h /// /// \note The purpose of the RBTree is to provide a generic map with /// domain names as the key that can be used by various BIND 10 modules or /// even by other applications. However, because of some unresolved design /// issue, the design and interface are not fixed, and RBTree isn't ready /// to be used as a base data structure by other modules. #include #include #include #include #include #include #include #include #include namespace isc { namespace datasrc { namespace helper { /// \brief Helper function to remove the base domain from super domain. /// /// The precondition of this function is the super_name contains the /// sub_name so /// \code Name a("a.b.c"); /// Name b("b.c"); /// Name c = a - b; /// \endcode /// c will contain "a". /// /// \note Functions in this namespace is not intended to be used outside of /// RBTree implementation. inline isc::dns::Name operator-(const isc::dns::Name& super_name, const isc::dns::Name& sub_name) { return (super_name.split(0, super_name.getLabelCount() - sub_name.getLabelCount())); } } /// Forward declare RBTree class here is convinent for following friend /// class declare inside RBNode and RBTreeNodeChain template class RBTree; /// \brief \c RBNode is used by RBTree to store any data related to one domain /// name. /// /// This is meant to be used only from RBTree. It is meaningless to inherit it /// or create instances of it from elsewhere. For that reason, the constructor /// is private. /// /// It serves three roles. One is to keep structure of the \c RBTree as a /// red-black tree. For that purpose, it has left, right and parent pointers /// and color member. These are private and accessed only from within the tree. /// /// The second one is to store data for one domain name. The data related /// functions can be used to access and set the data. /// /// The third role is to keep the hierarchy of domains. The down pointer /// points to a subtree of subdomains. The parent pointer of a subtree's /// root node points to the parent leaf of the upper tree. /// /// One special kind of node is non-terminal node. It has subdomains with /// RRsets, but doesn't have any RRsets itself. template class RBNode : public boost::noncopyable { private: /// The RBNode is meant for use from within RBTree, so it has access to /// it. friend class RBTree; /// \brief Just a type alias /// /// We are going to use a lot of these offset pointers here and they /// have a long name. typedef boost::interprocess::offset_ptr > RBNodePtr; /// \name Constructors /// /// \note The existence of a RBNode without a RBTree is meaningless. /// Therefore the constructors are private. //@{ /// \brief Constructor from the node name. /// /// \param name The *relative* domain name (if this will live inside /// a.b.c and is called d.e.a.b.c, then you pass d.e). RBNode(const isc::dns::Name& name); //@} public: /// \brief Alias for shared pointer to the data. typedef boost::shared_ptr NodeDataPtr; /// Node flags. /// /// Each flag value defines a non default property for a specific node. /// These are defined as bitmask type values for the convenience of /// internal implementation, but applications are expected to use /// each flag separately via the enum definitions. /// /// All (settable) flags are off by default; they must be explicitly /// set to on by the \c setFlag() method. enum Flags { FLAG_CALLBACK = 1, ///< Callback enabled. See \ref callback FLAG_RED = 2, ///< Node color; 1 if node is red, 0 if node is black. FLAG_SUBTREE_ROOT = 4, ///< Set if the node is the root of a subtree FLAG_USER1 = 0x80000000U, ///< Application specific flag FLAG_USER2 = 0x40000000U, ///< Application specific flag FLAG_USER3 = 0x20000000U ///< Application specific flag }; private: // Some flag values are expected to be used for internal purposes // (e.g., representing the node color) in future versions, so we // limit the settable flags via the \c setFlag() method to those // explicitly defined in \c Flags. This constant represents all // such flags. static const uint32_t SETTABLE_FLAGS = (FLAG_CALLBACK | FLAG_USER1 | FLAG_USER2 | FLAG_USER3); public: /// \brief Destructor /// /// It might seem strange that constructors are private and destructor /// public, but this is needed because of shared pointers need access /// to the destructor. /// /// You should never call anything like: /// \code delete pointer_to_node; \endcode /// The RBTree handles both creation and destructoion of nodes. ~RBNode(); /// \name Getter functions. //@{ /// \brief Return the name of current node. /// /// It's relative to its containing node. /// /// To get the absolute name of one node, the node path from the top node /// to current node has to be recorded. const isc::dns::Name& getName() const { return (name_); } /// \brief Return the data stored in this node. /// /// You should not delete the data, it is handled by shared pointers. NodeDataPtr& getData() { return (data_); } /// \brief Return the data stored in this node. const NodeDataPtr& getData() const { return (data_); } /// \brief return whether the node has related data. /// /// There can be empty nodes inside the RBTree. They are usually the /// non-terminal domains, but it is possible (yet probably meaningless) /// empty nodes anywhere. bool isEmpty() const { return (data_.get() == NULL); } //@} /// \name Setter functions. //@{ /// \brief Set the data stored in the node. void setData(const NodeDataPtr& data) { data_ = data; } //@} /// \name Node flag manipulation methods //@{ /// Get the status of a node flag. /// /// This method returns whether the given node flag is set (enabled) /// on the node. The \c flag parameter is expected to be one of the /// defined \c Flags constants. For simplicity, the method interface /// does not prohibit passing an undefined flag or combined flags, but /// the return value in such a case will be meaningless for the caller /// (an application would have to use an ugly cast for such an unintended /// form of call, which will hopefully avoid accidental misuse). /// /// \exception None /// \param flag The flag to be tested. /// \return \c true if the \c flag is set; \c false otherwise. bool getFlag(Flags flag) const { return ((flags_ & flag) != 0); } /// Set or clear a node flag. /// /// This method changes the status of the specified node flag to either /// "on" (enabled) or "off" (disabled). The new status is specified by /// the \c on parameter. /// Like the \c getFlag() method, \c flag is expected to be one of the /// defined \c Flags constants. If an undefined or unsettable flag is /// specified, \c isc::InvalidParameter exception will be thrown. /// /// \exception isc::InvalidParameter Unsettable flag is specified /// \exception None otherwise /// \param flag The node flag to be changed. /// \param on If \c true, set the flag to on; otherwise set it to off. void setFlag(Flags flag, bool on = true) { if ((flag & ~SETTABLE_FLAGS) != 0) { isc_throw(isc::InvalidParameter, "Unsettable RBTree flag is being set"); } if (on) { flags_ |= flag; } else { flags_ &= ~flag; } } //@} private: /// \name Callback related methods /// /// See the description of \c RBTree::find() at \ref callback /// about callbacks. /// /// These methods never throw an exception. //@{ /// Return if callback is enabled at the node. //@} /// \brief Define rbnode color enum RBNodeColor {BLACK, RED}; /// \brief Returns the color of this node RBNodeColor getColor() const { if ((flags_ & FLAG_RED) != 0) { return (RED); } else { return (BLACK); } } /// \brief Sets the color of this node void setColor(const RBNodeColor color) { if (color == RED) { flags_ |= FLAG_RED; } else { flags_ &= ~FLAG_RED; } } void setSubTreeRoot(bool root) { if (root) { flags_ |= FLAG_SUBTREE_ROOT; } else { flags_ &= ~FLAG_SUBTREE_ROOT; } } bool isSubTreeRoot() const { return ((flags_ & FLAG_SUBTREE_ROOT) != 0); } public: /// \brief returns the parent of the root of its subtree /// /// This method takes a node and returns the parent of the root of /// its subtree (i.e, it returns the node's immediate ancestor in /// the tree-of-tree hierarchy). If the node is at the top level /// (which should be absolute), it will return \c NULL. /// /// This method never throws an exception. const RBNode* getUpperNode() const; private: /// \brief return the next node which is bigger than current node /// in the same subtree /// /// The next successor for this node is the next bigger node in terms of /// the DNSSEC order relation within the same single subtree. /// Note that it may NOT be the next bigger node in the entire RBTree; /// RBTree is a tree in tree, and the real next node may reside in /// an upper or lower subtree of the subtree where this node belongs. /// For example, if this node has a sub domain, the real next node is /// the smallest node in the sub domain tree. /// /// If this node is the biggest node within the subtree, this method /// returns \c NULL. /// /// This method never throws an exception. const RBNode* successor() const; /// \brief return the next node which is smaller than current node /// in the same subtree /// /// The predecessor for this node is the next smaller node in terms of /// the DNSSEC order relation within the same single subtree. /// Note that it may NOT be the next smaller node in the entire RBTree; /// RBTree is a tree in tree, and the real next node may reside in /// an upper or lower subtree of the subtree where this node belongs. /// For example, if the predecessor node has a sub domain, the real next /// node is the largest node in the sub domain tree. /// /// If this node is the smallest node within the subtree, this method /// returns \c NULL. /// /// This method never throws an exception. const RBNode* predecessor() const; /// \brief private shared implementation of successor and predecessor /// /// As the two mentioned functions are merely mirror images of each other, /// it makes little sense to keep both versions. So this is the body of the /// functions and we call it with the correct pointers. /// /// Not to be called directly, not even by friends. /// /// The overhead of the member pointers should be optimised out, as this /// will probably get completely inlined into predecessor and successor /// methods. const RBNode* abstractSuccessor(typename RBNode::RBNodePtr RBNode::*left, typename RBNode::RBNodePtr RBNode::*right) const; /// \name Data to maintain the rbtree structure. /// /// We keep them as offset pointers. This is part of a future plan, when we /// want to share the image of the tree between multiple processes. /// However, whenever we have a chance, we switch to bare pointers during /// the processing. The pointers on stack are never shared and the offset /// pointers have non-trivial performance impact. //@{ RBNodePtr parent_; /// \brief Access the parent_ as bare pointer. RBNode* getParent() { return (parent_.get()); } /// \brief Access the parent_ as bare pointer, const. const RBNode* getParent() const { return (parent_.get()); } RBNodePtr left_; /// \brief Access the left_ as bare pointer. RBNode* getLeft() { return (left_.get()); } /// \brief Access the left_ as bare pointer, const. const RBNode* getLeft() const { return (left_.get()); } RBNodePtr right_; /// \brief Access the right_ as bare pointer. RBNode* getRight() { return (right_.get()); } /// \brief Access the right_ as bare pointer, const. const RBNode* getRight() const { return (right_.get()); } RBNodeColor color_; //@} /// \brief Relative name of the node. isc::dns::Name name_; /// \brief Data stored here. NodeDataPtr data_; /// \brief The subdomain tree. /// /// This points to the root node of trees of subdomains of this domain. /// /// \par Adding down pointer to \c RBNode has two purposes: /// \li Accelerate the search process, with sub domain tree, it splits the /// big flat tree into several hierarchy trees. /// \li It saves memory usage as it allows storing only relative names, /// avoiding storage of the same domain labels multiple times. RBNodePtr down_; /// \brief Access the down_ as bare pointer. RBNode* getDown() { return (down_.get()); } /// \brief Access the down_ as bare pointer, const. const RBNode* getDown() const { return (down_.get()); } /// \brief If callback should be called when traversing this node in /// RBTree::find(). /// /// \todo It might be needed to put it into more general attributes field. uint32_t flags_; }; template RBNode::RBNode(const isc::dns::Name& name) : parent_(NULL), left_(NULL), right_(NULL), name_(name), down_(NULL), flags_(FLAG_RED | FLAG_SUBTREE_ROOT) { } template RBNode::~RBNode() { } template const RBNode* RBNode::getUpperNode() const { const RBNode* current = this; // current would never be equal to NULL here (in a correct tree // implementation) while (!current->isSubTreeRoot()) { current = current->getParent(); } return (current->getParent()); } template const RBNode* RBNode::abstractSuccessor(typename RBNode::RBNodePtr RBNode::*left, typename RBNode::RBNodePtr RBNode::*right) const { // This function is written as a successor. It becomes predecessor if // the left and right pointers are swapped. So in case of predecessor, // the left pointer points to right and vice versa. Don't get confused // by the idea, just imagine the pointers look into a mirror. const RBNode* current = this; // If it has right node, the successor is the left-most node of the right // subtree. if ((current->*right).get() != NULL) { current = (current->*right).get(); const RBNode* left_n; while ((left_n = (current->*left).get()) != NULL) { current = left_n; } return (current); } // Otherwise go up until we find the first left branch on our path to // root. If found, the parent of the branch is the successor. // Otherwise, we return the null node const RBNode* parent = current->getParent(); while ((!current->isSubTreeRoot()) && (current == (parent->*right).get())) { current = parent; parent = parent->getParent(); } if (!current->isSubTreeRoot()) { return (parent); } else { return (NULL); } } template const RBNode* RBNode::successor() const { return (abstractSuccessor(&RBNode::left_, &RBNode::right_)); } template const RBNode* RBNode::predecessor() const { // Swap the left and right pointers for the abstractSuccessor return (abstractSuccessor(&RBNode::right_, &RBNode::left_)); } /// \brief RBTreeNodeChain stores detailed information of \c RBTree::find() /// result. /// /// - The \c RBNode that was last compared with the search name, and /// the comparison result at that point in the form of /// \c isc::dns::NameComparisonResult. /// - A sequence of nodes that forms a path to the found node. /// /// The comparison result can be used to handle some rare cases such as /// empty node processing. /// The node sequence keeps track of the nodes to reach any given node from /// the root of RBTree. /// /// Currently, RBNode does not have "up" pointers in them (i.e., back pointers /// from the root of one level of tree of trees to the node in the parent /// tree whose down pointer points to that root node) for memory usage /// reasons, so there is no other way to find the path back to the root from /// any given RBNode. /// /// \note This design may change in future versions. In particular, it's /// quite likely we want to have that pointer if we want to optimize name /// compression by exploiting the structure of the zone. If and when that /// happens we should also revisit the need for the chaining. /// Also, the class name may not be appropriate now that it contains other /// information than a node "chain", and the chain itself may even be /// deprecated. Something like "RBTreeFindContext" may be a better name. /// This point should be revisited later. /// /// RBTreeNodeChain is constructed and manipulated only inside the \c RBTree /// class. /// \c RBTree uses it as an inner data structure to iterate over the whole /// RBTree. /// This is the reason why manipulation methods such as \c push() and \c pop() /// are private (and not shown in the doxygen document). template class RBTreeNodeChain { /// RBTreeNodeChain is initialized by RBTree, only RBTree has /// knowledge to manipulate it. friend class RBTree; public: /// \name Constructors and Assignment Operator. /// /// \note The copy constructor and the assignment operator are /// intentionally defined as private, making this class non copyable. /// This may have to be changed in a future version with newer need. /// For now we explicitly disable copy to avoid accidental copy happens /// unintentionally. //{@ /// The default constructor. /// /// \exception None RBTreeNodeChain() : node_count_(0), last_compared_(NULL), // XXX: meaningless initial values: last_comparison_(0, 0, isc::dns::NameComparisonResult::EQUAL) {} private: RBTreeNodeChain(const RBTreeNodeChain&); RBTreeNodeChain& operator=(const RBTreeNodeChain&); //@} public: /// Clear the state of the chain. /// /// This method re-initializes the internal state of the chain so that /// it can be reused for subsequent operations. /// /// \exception None void clear() { node_count_ = 0; last_compared_ = NULL; } /// Return the \c RBNode that was last compared in \c RBTree::find(). /// /// If this chain has been passed to \c RBTree::find() and there has /// been name comparison against the search name, the last compared /// \c RBNode is recorded within the chain. This method returns that /// node. /// If \c RBTree::find() hasn't been called with this chain or name /// comparison hasn't taken place (which is possible if the tree is empty), /// this method returns \c NULL. /// /// \exception None const RBNode* getLastComparedNode() const { return (last_compared_); } /// Return the result of last name comparison in \c RBTree::find(). /// /// Like \c getLastComparedNode(), \c RBTree::find() records the result /// of the last name comparison in the chain. This method returns the /// result. /// The return value of this method is only meaningful when comparison /// has taken place, i.e, when \c getLastComparedNode() would return a /// non \c NULL value. /// /// \exception None const isc::dns::NameComparisonResult& getLastComparisonResult() const { return (last_comparison_); } /// \brief Return the number of levels stored in the chain. /// /// It's equal to the number of nodes in the chain; for an empty /// chain, 0 will be returned. /// /// \exception None unsigned int getLevelCount() const { return (node_count_); } /// \brief return the absolute name for the node which this /// \c RBTreeNodeChain currently refers to. /// /// The chain must not be empty. /// /// \exception isc::BadValue the chain is empty. /// \exception std::bad_alloc memory allocation for the new name fails. isc::dns::Name getAbsoluteName() const { if (isEmpty()) { isc_throw(isc::BadValue, "RBTreeNodeChain::getAbsoluteName is called on an empty " "chain"); } const RBNode* top_node = top(); isc::dns::Name absolute_name = top_node->getName(); int node_count = node_count_ - 1; while (node_count > 0) { top_node = nodes_[node_count - 1]; absolute_name = absolute_name.concatenate(top_node->getName()); --node_count; } return (absolute_name); } private: // the following private functions check invariants about the internal // state using assert() instead of exception. The state of a chain // can only be modified by operations within this file, so if any of the // assumptions fails it means an internal bug. /// \brief return whether node chain has node in it. /// /// \exception None bool isEmpty() const { return (node_count_ == 0); } /// \brief return the top node for the node chain /// /// RBTreeNodeChain store all the nodes along top node to /// root node of RBTree /// /// \exception None const RBNode* top() const { assert(!isEmpty()); return (nodes_[node_count_ - 1]); } /// \brief pop the top node from the node chain /// /// After pop, up/super node of original top node will be /// the top node /// /// \exception None void pop() { assert(!isEmpty()); --node_count_; } /// \brief add the node into the node chain /// /// If the node chain isn't empty, the node should be /// the sub domain of the original top node in node chain /// otherwise the node should be the root node of RBTree. /// /// \exception None void push(const RBNode* node) { assert(node_count_ < RBT_MAX_LEVEL); nodes_[node_count_++] = node; } private: // The max label count for one domain name is Name::MAX_LABELS (128). // Since each node in rbtree stores at least one label, it's also equal // to the possible maximum level. const static int RBT_MAX_LEVEL = isc::dns::Name::MAX_LABELS; int node_count_; const RBNode* nodes_[RBT_MAX_LEVEL]; const RBNode* last_compared_; isc::dns::NameComparisonResult last_comparison_; }; // note: the following class description is documented using multiline comments // because the verbatim diagram contain a backslash, which could be interpreted // as escape of newline in singleline comment. /** * \brief \c RBTree class represents all the domains with the same suffix. * It can be used to store the domains in one zone, for example. * * RBTree is a generic map from domain names to any kind of data. Internally, * it uses a red-black tree. However, it isn't one tree containing everything. * Subdomains are trees, so this structure is recursive - trees inside trees. * But, from the interface point of view, it is opaque data structure. * * \c RBTree splits the domain space into hierarchy red black trees; nodes * in one tree has the same base name. The benefit of this struct is that: * - Enhances the query performace compared with one big flat red black tree. * - Decreases the memory footprint, as it doesn't store the suffix labels * multiple times. * * Depending on different usage, rbtree will support different search policies. * Whether to return an empty node to end user is one policy among them. * The default policy is to NOT return an empty node to end user; * to change the behavior, specify \c true for the constructor parameter * \c returnEmptyNode. * \note The search policy only affects the \c find() behavior of RBTree. * When inserting one name into RBTree, if the node with the name already * exists in the RBTree and it's an empty node which doesn't have any data, * the \c insert() method will still return \c ALREADYEXISTS regardless of * the search policy. * * \anchor diagram * * with the following names: * - a * - b * - c * - x.d.e.f * - z.d.e.f * - g.h * - o.w.y.d.e.f * - p.w.y.d.e.f * - q.w.y.d.e.f * * the tree will look like: * \verbatim b / \ a d.e.f /|\ c | g.h | w.y /|\ x | z | p / \ o q \endverbatim * \todo * - add remove interface * - add iterator to iterate over the whole \c RBTree. This may be necessary, * for example, to support AXFR. */ template class RBTree : public boost::noncopyable { friend class RBNode; public: /// \brief The return value for the \c find() and insert() methods enum Result { SUCCESS, ///< Insert was successful /// \brief The node returned from find mathes exactly the name given EXACTMATCH, PARTIALMATCH, ///< A superdomain node was found NOTFOUND, ///< Not even any superdomain was found /// \brief Returned by insert() if a node of the name already exists ALREADYEXISTS, }; /// \name Constructor and Destructor //@{ /// The constructor. /// /// It never throws an exception. explicit RBTree(bool returnEmptyNode = false); /// \b Note: RBTree is not intended to be inherited so the destructor /// is not virtual ~RBTree(); //@} /// \name Find methods /// /// \brief Find the node that gives a longest match against the given name. /// /// \anchor find /// /// These methods search the RBTree for a node whose name is longest /// against name. The found node, if any, is returned via the node pointer. /// /// By default, nodes that don't have data (see RBNode::isEmpty) are /// ignored and the result can be NOTFOUND even if there's a node whose /// name matches. If the \c RBTree is constructed with its /// \c returnEmptyNode parameter being \c true, empty nodes will also /// be match candidates. /// /// \note Even when \c returnEmptyNode is \c true, not all empty nodes /// in terms of the DNS protocol may necessarily be found by this method. /// For example, in the \ref diagram shown in the class description, /// the name y.d.e.f is logically contained in the tree as part of the /// node w.y, but the \c find() variants cannot find the former for /// the search key of y.d.e.f, no matter how the \c RBTree is constructed. /// The caller of this method must use a different way to identify the /// hidden match when necessary. /// /// These methods involve operations on names that can throw an exception. /// If that happens the exception will be propagated to the caller. /// The callback function should generally not throw an exception, but /// if it throws, the exception will be propagated to the caller. /// /// The \c name parameter says what should be found. The node parameter /// is output-only, and in case of EXACTMATCH or PARTIALMATCH, it is set /// to a pointer to the found node. /// /// They return: /// - EXACTMATCH when a node with the same name as requested exists. /// - PARTIALMATCH when a node with the same name does not exist (or is /// empty), but there's a (nonempty) superdomain of the requested one. /// The superdomain with longest name is returned through the node /// parameter. Beware that if you store a zone in the tree, you may get /// PARTIALMATCH with zone apex when the given domain name is not there. /// You should not try to delegate into another zone in that case. /// - NOTFOUND if there's no node with the same name nor any superdomain /// of it. In that case, node parameter is left intact. //@{ /// \brief Simple find. /// /// Acts as described in the \ref find section. Result find(const isc::dns::Name& name, RBNode** node) const { RBTreeNodeChain node_path; return (find(name, node, node_path, NULL, NULL)); } /// \brief Simple find returning immutable node. /// /// Acts as described in the \ref find section, but returns immutable node /// pointer. Result find(const isc::dns::Name& name, const RBNode** node) const { RBTreeNodeChain node_path; RBNode *target_node = NULL; Result ret = (find(name, &target_node, node_path, NULL, NULL)); if (ret != NOTFOUND) { *node = target_node; } return (ret); } /// \brief Simple find, with node_path tracking /// /// Acts as described in the \ref find section. Result find(const isc::dns::Name& name, RBNode** node, RBTreeNodeChain& node_path) const { return (find(name, node, node_path, NULL, NULL)); } /// \brief Simple find returning immutable node, with node_path tracking /// /// Acts as described in the \ref find section, but returns immutable node /// pointer. Result find(const isc::dns::Name& name, const RBNode** node, RBTreeNodeChain& node_path) const { RBNode *target_node = NULL; Result ret = (find(name, &target_node, node_path, NULL, NULL)); if (ret != NOTFOUND) { *node = target_node; } return (ret); } /// \brief Find with callback and node chain. /// \anchor callback /// /// This version of \c find() is specifically designed for the backend /// of the \c InMemoryZoneFinder class, and implements all necessary /// features for that purpose. Other applications shouldn't need these /// additional features, and should normally use the simpler versions. /// /// This version of \c find() calls the callback whenever traversing (on /// the way from root down the tree) a marked node on the way down through /// the domain namespace (see \c RBNode::FLAG_CALLBACK). /// /// If you return true from the callback, the search is stopped and a /// PARTIALMATCH is returned with the given node. Note that this node /// doesn't really need to be the one with longest possible match. /// /// The callback is not called for the node which matches exactly /// (EXACTMATCH is returned). This is typically the last node in the /// traversal during a successful search. /// /// This callback mechanism was designed with zone cut (delegation) /// processing in mind. The marked nodes would be the ones at delegation /// points. It is not expected that any other applications would need /// callbacks; they should use the versions of find without callbacks. /// The callbacks are not general functors for the same reason - we don't /// expect it to be needed. /// /// Another special feature of this version is the ability to record /// more detailed information regarding the search result. /// /// This information will be returned via the \c node_path parameter, /// which is an object of class \c RBTreeNodeChain. /// The passed parameter must be empty. /// /// On success, the node sequence stored in \c node_path will contain all /// the ancestor nodes from the found node towards the root. /// For example, if we look for o.w.y.d.e.f in the example \ref diagram, /// \c node_path will contain w.y and d.e.f; the \c top() node of the /// chain will be o, w.y and d.e.f will be stored below it. /// /// This feature can be used to get the absolute name for a node; /// to do so, we need to travel upside from the node toward the root, /// concatenating all ancestor names. With the current implementation /// it's not possible without a node chain, because there is a no pointer /// from the root of a subtree to the parent subtree (this may change /// in a future version). A node chain can also be used to find the /// next and previous nodes of a given node in the entire RBTree; /// the \c nextNode() and \c previousNode() methods take a node /// chain as a parameter. /// /// \exception isc::BadValue node_path is not empty. /// /// \param name Target to be found /// \param node On success (either \c EXACTMATCH or \c PARTIALMATCH) /// it will store a pointer to the matching node /// \param node_path Other search details will be stored (see the /// description) /// \param callback If non- \c NULL, a call back function to be called /// at marked nodes (see the description). /// \param callback_arg A caller supplied argument to be passed to /// \c callback. /// /// \return As in the description, but in case of callback returning /// \c true, it returns immediately with the current node. template Result find(const isc::dns::Name& name, RBNode** node, RBTreeNodeChain& node_path, bool (*callback)(const RBNode&, CBARG), CBARG callback_arg) const; /// \brief Simple find returning immutable node. /// /// Acts as described in the \ref find section, but returns immutable /// node pointer. template Result find(const isc::dns::Name& name, const RBNode** node, RBTreeNodeChain& node_path, bool (*callback)(const RBNode&, CBARG), CBARG callback_arg) const { RBNode* target_node = NULL; Result ret = find(name, &target_node, node_path, callback, callback_arg); if (ret != NOTFOUND) { *node = target_node; } return (ret); } //@} /// \brief return the next bigger node in DNSSEC order from a given node /// chain. /// /// This method identifies the next bigger node of the node currently /// referenced in \c node_path and returns it. /// This method also updates the passed \c node_path so that it will store /// the path for the returned next node. /// It will be convenient when we want to iterate over the all nodes /// of \c RBTree; we can do this by calling this method repeatedly /// starting from the root node. /// /// \note \c nextNode() will iterate over all the nodes in RBTree including /// empty nodes. If empty node isn't desired, it's easy to add logic to /// check return node and keep invoking \c nextNode() until the non-empty /// node is retrieved. /// /// \exception isc::BadValue node_path is empty. /// /// \param node_path A node chain that stores all the nodes along the path /// from root to node. /// /// \return An \c RBNode that is next bigger than \c node; if \c node is /// the largest, \c NULL will be returned. const RBNode* nextNode(RBTreeNodeChain& node_path) const; /// \brief return the next smaller node in DNSSEC order from a node /// searched by RBTree::find(). /// /// This acts similarly to \c nextNode(), but it walks in the other /// direction. But unlike \c nextNode(), this can start even if the /// node requested by \c find() was not found. In that case, it will /// identify the node that is previous to the queried name. /// /// \note \c previousNode() will iterate over all the nodes in RBTree /// including empty nodes. If empty node isn't desired, it's easy to add /// logic to check return node and keep invoking \c previousNode() until the /// non-empty node is retrieved. /// /// \exception isc::BadValue node_path is empty. /// /// \param node_path A node chain that stores all the nodes along the path /// from root to node and the result of \c find(). This will get modified. /// You should not use the node_path again except for repetitive calls /// of this method. /// /// \return An \c RBNode that is next smaller than \c node; if \c node is /// the smallest, \c NULL will be returned. const RBNode* previousNode(RBTreeNodeChain& node_path) const; /// \brief Get the total number of nodes in the tree /// /// It includes nodes internally created as a result of adding a domain /// name that is a subdomain of an existing node of the tree. /// This function is mainly intended to be used for debugging. int getNodeCount() const { return (node_count_); } /// \name Debug function //@{ /// \brief Print the nodes in the trees. /// /// \param os A \c std::ostream object to which the tree is printed. /// \param depth A factor of the initial indentation. Each line /// will begin with space character repeating 5 * depth /// times. void dumpTree(std::ostream& os, unsigned int depth = 0) const; /// \brief Print the nodes in the trees for processing with /// Graphviz's dot. /// /// \param os A \c std::ostream object to which the tree is printed. /// \param show_pointers Show node and parent pointers in the node void dumpDot(std::ostream& os, bool show_pointers = false) const; //@} /// \name Modify functions //@{ /// \brief Insert the domain name into the tree. /// /// It either finds an already existing node of the given name, or inserts /// a new one if none exists yet. In any case, the \c inserted_node parameter /// is set to point to that node. You can fill data into it or modify it. /// So, if you don't know if a node exists or not and you need to modify /// it, just call insert and act by the result. /// /// Please note that the tree can add some empty nodes by itself, so don't /// assume that if you didn't insert a node of that name it doesn't exist. /// /// This method normally involves resource allocation. If it fails /// the corresponding standard exception will be thrown. /// /// This method does not provide the strong exception guarantee in its /// strict sense; if an exception is thrown in the middle of this /// method, the internal structure may change. However, it should /// still retain the same property as a mapping container before this /// method is called. For example, the result of \c find() should be /// the same. This method provides the weak exception guarantee in its /// normal sense. /// /// \param name The name to be inserted into the tree. /// \param inserted_node This is an output parameter and is set to the /// node. /// /// \return /// - SUCCESS The node was added. /// - ALREADYEXISTS There was already a node of that name, so it was not /// added. Result insert(const isc::dns::Name& name, RBNode** inserted_node); /// \brief Swaps two tree's contents. /// /// This acts the same as many std::*.swap functions, exchanges the /// contents. This doesn't throw anything. void swap(RBTree& other) { std::swap(root_, other.root_); std::swap(node_count_, other.node_count_); } //@} private: /// \name RBTree balance functions //@{ void insertRebalance(typename RBNode::RBNodePtr* root, RBNode* node); RBNode* rightRotate(typename RBNode::RBNodePtr* root, RBNode* node); RBNode* leftRotate(typename RBNode::RBNodePtr* root, RBNode* node); //@} /// \name Helper functions //@{ /// \brief delete tree whose root is equal to node void deleteHelper(RBNode *node); /// \brief Print the information of given RBNode. void dumpTreeHelper(std::ostream& os, const RBNode* node, unsigned int depth) const; /// \brief Print the information of given RBNode for dot. int dumpDotHelper(std::ostream& os, const RBNode* node, int* nodecount, bool show_pointers) const; /// \brief Indentation helper function for dumpTree static void indent(std::ostream& os, unsigned int depth); /// Split one node into two nodes, keep the old node and create one new /// node, old node will hold the base name, new node will be the down node /// of old node, new node will hold the sub_name, the data /// of old node will be move into new node, and old node became non-terminal void nodeFission(RBNode& node, const isc::dns::Name& sub_name); //@} typename RBNode::RBNodePtr root_; /// the node count of current tree unsigned int node_count_; /// search policy for rbtree const bool needsReturnEmptyNode_; }; template RBTree::RBTree(bool returnEmptyNode) : root_(NULL), node_count_(0), needsReturnEmptyNode_(returnEmptyNode) { } template RBTree::~RBTree() { deleteHelper(root_.get()); assert(node_count_ == 0); } template void RBTree::deleteHelper(RBNode* root) { if (root == NULL) { return; } RBNode* node = root; while (root->getLeft() != NULL || root->getRight() != NULL) { RBNode* left(NULL); RBNode* right(NULL); while ((left = node->getLeft()) != NULL || (right = node->getRight()) != NULL) { node = (left != NULL) ? left : right; } RBNode* parent = node->getParent(); if (parent->getLeft() == node) { parent->left_ = NULL; } else { parent->right_ = NULL; } deleteHelper(node->getDown()); delete node; --node_count_; node = parent; } deleteHelper(root->getDown()); delete root; --node_count_; } template template typename RBTree::Result RBTree::find(const isc::dns::Name& target_name, RBNode** target, RBTreeNodeChain& node_path, bool (*callback)(const RBNode&, CBARG), CBARG callback_arg) const { using namespace helper; if (!node_path.isEmpty()) { isc_throw(isc::BadValue, "RBTree::find is given a non empty chain"); } RBNode* node = root_.get(); Result ret = NOTFOUND; isc::dns::Name name = target_name; while (node != NULL) { node_path.last_compared_ = node; node_path.last_comparison_ = name.compare(node->name_); const isc::dns::NameComparisonResult::NameRelation relation = node_path.last_comparison_.getRelation(); if (relation == isc::dns::NameComparisonResult::EQUAL) { if (needsReturnEmptyNode_ || !node->isEmpty()) { node_path.push(node); *target = node; ret = EXACTMATCH; } break; } else { const int common_label_count = node_path.last_comparison_.getCommonLabels(); // If the common label count is 1, there is no common label between // the two names, except the trailing "dot". In this case the two // sequences of labels have essentially no hierarchical // relationship in terms of matching, so we should continue the // binary search. One important exception is when the node // represents the root name ("."), in which case the comparison // result must indeed be considered subdomain matching. (We use // getLength() to check if the name is root, which is an equivalent // but cheaper way). if (common_label_count == 1 && node->name_.getLength() != 1) { node = (node_path.last_comparison_.getOrder() < 0) ? node->getLeft() : node->getRight(); } else if (relation == isc::dns::NameComparisonResult::SUBDOMAIN) { if (needsReturnEmptyNode_ || !node->isEmpty()) { ret = PARTIALMATCH; *target = node; if (callback != NULL && node->getFlag(RBNode::FLAG_CALLBACK)) { if ((callback)(*node, callback_arg)) { break; } } } node_path.push(node); name = name - node->name_; node = node->getDown(); } else { break; } } } return (ret); } template const RBNode* RBTree::nextNode(RBTreeNodeChain& node_path) const { if (node_path.isEmpty()) { isc_throw(isc::BadValue, "RBTree::nextNode is given an empty chain"); } const RBNode* node = node_path.top(); // if node has sub domain, the next domain is the smallest // domain in sub domain tree const RBNode* down = node->getDown(); if (down != NULL) { const RBNode* left_most = down; while (left_most->getLeft() != NULL) { left_most = left_most->getLeft(); } node_path.push(left_most); return (left_most); } // try to find a successor. // if no successor found move to up level, the next successor // is the successor of up node in the up level tree, if // up node doesn't have successor we gonna keep moving to up // level while (!node_path.isEmpty()) { const RBNode* up_node_successor = node_path.top()->successor(); node_path.pop(); if (up_node_successor != NULL) { node_path.push(up_node_successor); return (up_node_successor); } } return (NULL); } template const RBNode* RBTree::previousNode(RBTreeNodeChain& node_path) const { if (getNodeCount() == 0) { // Special case for empty trees. It would look every time like // we didn't search, because the last compared is empty. This is // a slight hack and not perfect, but this is better than throwing // on empty tree. And we probably won't meet an empty tree in practice // anyway. return (NULL); } if (node_path.last_compared_ == NULL) { isc_throw(isc::BadValue, "RBTree::previousNode() called before find()"); } // If the relation isn't EQUAL, it means the find was called previously // and didn't find the exact node. Therefore we need to locate the place // to start iterating the chain of domains. // // The logic here is not too complex, we just need to take care to handle // all the cases and decide where to go from there. switch (node_path.last_comparison_.getRelation()) { case dns::NameComparisonResult::COMMONANCESTOR: // We compared with a leaf in the tree and wanted to go to one of // the children. But the child was not there. It now depends on the // direction in which we wanted to go. if (node_path.last_comparison_.getOrder() < 0) { // We wanted to go left. So the one we compared with is // the one higher than we wanted. If we just put it into // the node_path, then the following algorithm below will find // the smaller one. // // This is exactly the same as with superdomain below. // Therefore, we just fall through to the next case. } else { // We wanted to go right. That means we want to output the // one which is the largest in the tree defined by the // compared one (it is either the compared one, or some // subdomain of it). There probably is not an easy trick // for this, so we just find the correct place. const RBNode* current(node_path.last_compared_); while (current != NULL) { node_path.push(current); // Go a level down and as much right there as possible current = current->getDown(); if (current != NULL) { const RBNode* right; while ((right = current->getRight()) != NULL) { current = right; } } } // Now, the one on top of the path is the one we want. We // return it now and leave it there, so we can search for // previous of it the next time we'are called. node_path.last_comparison_ = dns::NameComparisonResult(0, 0, dns::NameComparisonResult::EQUAL); return (node_path.top()); } // No break; here - we want to fall through. See above. case dns::NameComparisonResult::SUPERDOMAIN: // This is the case there's a "compressed" node and we looked for // only part of it. The node itself is larger than we wanted, but // if we put it to the node_path and then go one step left from it, // we get the correct result. node_path.push(node_path.last_compared_); // Correct the comparison result, so we won't trigger this case // next time previousNode is called. We already located the correct // place to start. The value is partly nonsense, but that doesn't // matter any more. node_path.last_comparison_ = dns::NameComparisonResult(0, 0, dns::NameComparisonResult::EQUAL); break; case dns::NameComparisonResult::SUBDOMAIN: // A subdomain means we returned the one above the searched one // already and it is on top of the stack. This is was smaller // than the one already, but we want to return yet smaller one. // So we act as if it was EQUAL. break; case dns::NameComparisonResult::EQUAL: // The find gave us an exact match or the previousNode was called // already, which located the exact node. The rest of the function // goes one domain left and returns it for us. break; default: // This must not happen as Name::compare() never returns NONE. isc_throw(isc::Unexpected, "Name::compare() returned unexpected result"); } // So, the node_path now contains the path to a node we want previous for. // We just need to go one step left. if (node_path.isEmpty()) { // We got past the first one. So, we're returning NULL from // now on. return (NULL); } const RBNode* node(node_path.top()); // Try going left in this tree node = node->predecessor(); if (node == NULL) { // We are the smallest ones in this tree. We go one level // up. That one is the smaller one than us. node_path.pop(); if (node_path.isEmpty()) { // We're past the first one return (NULL); } else { return (node_path.top()); } } // Exchange the node at the top of the path, as we move horizontaly // through the domain tree node_path.pop(); node_path.push(node); // Try going as deep as possible, keeping on the right side of the trees const RBNode* down; while ((down = node->getDown()) != NULL) { // Move to the tree below node = down; if (node != NULL) { // And get as much to the right of the tree as possible const RBNode* right; while ((right = node->getRight()) != NULL) { node = right; } } // Now, we found the right-most node in the sub-tree, we need to // include it in the path node_path.push(node); } // Now, if the current node has no down_ pointer any more, it's the // correct one. return (node); } template typename RBTree::Result RBTree::insert(const isc::dns::Name& target_name, RBNode** new_node) { using namespace helper; RBNode* parent = NULL; RBNode* current = root_.get(); RBNode* up_node = NULL; isc::dns::Name name = target_name; int order = -1; while (current != NULL) { const isc::dns::NameComparisonResult compare_result = name.compare(current->name_); const isc::dns::NameComparisonResult::NameRelation relation = compare_result.getRelation(); if (relation == isc::dns::NameComparisonResult::EQUAL) { if (new_node != NULL) { *new_node = current; } return (ALREADYEXISTS); } else { const int common_label_count = compare_result.getCommonLabels(); // Note: see find() for the check of getLength(). if (common_label_count == 1 && current->name_.getLength() != 1) { parent = current; order = compare_result.getOrder(); current = order < 0 ? current->getLeft() : current->getRight(); } else { // insert sub domain to sub tree if (relation == isc::dns::NameComparisonResult::SUBDOMAIN) { parent = NULL; up_node = current; name = name - current->name_; current = current->getDown(); } else { // The number of labels in common is fewer // than the number of labels at the current // node, so the current node must be adjusted // to have just the common suffix, and a down // pointer made to a new tree. const isc::dns::Name common_ancestor = name.split( name.getLabelCount() - common_label_count, common_label_count); nodeFission(*current, common_ancestor); } } } } typename RBNode::RBNodePtr* current_root = (up_node != NULL) ? &(up_node->down_) : &root_; // using auto_ptr here is avoid memory leak in case of exceptoin raised // after the RBNode creation, if we can make sure no exception will be // raised until the end of the function, we can remove it for optimization std::auto_ptr > node(new RBNode(name)); node->parent_ = parent; if (parent == NULL) { *current_root = node.get(); //node is the new root of sub tree, so its init color // is BLACK node->setColor(RBNode::BLACK); node->setSubTreeRoot(true); node->parent_ = up_node; } else if (order < 0) { node->setSubTreeRoot(false); parent->left_ = node.get(); } else { node->setSubTreeRoot(false); parent->right_ = node.get(); } insertRebalance(current_root, node.get()); if (new_node != NULL) { *new_node = node.get(); } ++node_count_; node.release(); return (SUCCESS); } // Note: when we redesign this (still keeping the basic concept), we should // change this part so the newly created node will be used for the inserted // name (and therefore the name for the existing node doesn't change). // Otherwise, things like shortcut links between nodes won't work. template void RBTree::nodeFission(RBNode& node, const isc::dns::Name& base_name) { using namespace helper; const isc::dns::Name sub_name = node.name_ - base_name; // using auto_ptr here is to avoid memory leak in case of exception raised // after the RBNode creation std::auto_ptr > down_node(new RBNode(sub_name)); node.name_ = base_name; // the rest of this function should be exception free so that it keeps // consistent behavior (i.e., a weak form of strong exception guarantee) // even if code after the call to this function throws an exception. bool is_root = node.isSubTreeRoot(); std::swap(node.data_, down_node->data_); std::swap(node.flags_, down_node->flags_); node.setSubTreeRoot(is_root); down_node->down_ = node.getDown(); if (down_node->down_ != NULL) { down_node->down_->parent_ = down_node.get(); } node.down_ = down_node.get(); down_node->parent_ = &node; // Restore the color of the node (may have gotten changed by the flags swap) node.setColor(down_node->getColor()); // root node of sub tree, the initial color is BLACK down_node->setColor(RBNode::BLACK); // mark it as the root of a subtree down_node->setSubTreeRoot(true); ++node_count_; down_node.release(); } template void RBTree::insertRebalance(typename RBNode::RBNodePtr* root, RBNode* node) { RBNode* uncle; RBNode* parent; while (node != (*root).get() && (parent = node->getParent())->getColor() == RBNode::RED) { if (parent == parent->getParent()->getLeft()) { uncle = parent->getParent()->getRight(); if (uncle != NULL && uncle->getColor() == RBNode::RED) { parent->setColor(RBNode::BLACK); uncle->setColor(RBNode::BLACK); parent->getParent()->setColor(RBNode::RED); node = parent->getParent(); } else { if (node == parent->getRight()) { node = parent; leftRotate(root, node); parent = node->getParent(); } parent->setColor(RBNode::BLACK); parent->getParent()->setColor(RBNode::RED); rightRotate(root, parent->getParent()); } } else { uncle = parent->getParent()->getLeft(); if (uncle != NULL && uncle->getColor() == RBNode::RED) { parent->setColor(RBNode::BLACK); uncle->setColor(RBNode::BLACK); parent->getParent()->setColor(RBNode::RED); node = parent->getParent(); } else { if (node == parent->getLeft()) { node = parent; rightRotate(root, node); parent = node->getParent(); } parent->setColor(RBNode::BLACK); parent->getParent()->setColor(RBNode::RED); leftRotate(root, parent->getParent()); } } } (*root)->setColor(RBNode::BLACK); } template RBNode* RBTree::leftRotate(typename RBNode::RBNodePtr* root, RBNode* node) { RBNode* const right = node->getRight(); RBNode* const rleft = right->getLeft(); node->right_ = rleft; if (rleft != NULL) { rleft->parent_ = node; } RBNode* const parent = node->getParent(); right->parent_ = parent; if (!node->isSubTreeRoot()) { right->setSubTreeRoot(false); if (node == parent->getLeft()) { parent->left_ = right; } else { parent->right_ = right; } } else { right->setSubTreeRoot(true); *root = right; } right->left_ = node; node->parent_ = right; node->setSubTreeRoot(false); return (node); } template RBNode* RBTree::rightRotate(typename RBNode::RBNodePtr* root, RBNode* node) { RBNode* const left = node->getLeft(); RBNode* const lright = left->getRight(); node->left_ = lright; if (lright != NULL) { lright->parent_ = node; } RBNode* const parent = node->getParent(); left->parent_ = parent; if (!node->isSubTreeRoot()) { left->setSubTreeRoot(false); if (node == parent->getRight()) { parent->right_ = left; } else { parent->left_ = left; } } else { left->setSubTreeRoot(true); *root = left; } left->right_ = node; node->parent_ = left; node->setSubTreeRoot(false); return (node); } template void RBTree::dumpTree(std::ostream& os, unsigned int depth) const { indent(os, depth); os << "tree has " << node_count_ << " node(s)\n"; dumpTreeHelper(os, root_.get(), depth); } template void RBTree::dumpTreeHelper(std::ostream& os, const RBNode* node, unsigned int depth) const { if (node == NULL) { indent(os, depth); os << "NULL\n"; return; } indent(os, depth); os << node->name_.toText() << " (" << ((node->getColor() == RBNode::BLACK) ? "black" : "red") << ")"; if (node->isEmpty()) { os << " [invisible]"; } if (node->isSubTreeRoot()) { os << " [subtreeroot]"; } os << "\n"; const RBNode* down = node->getDown(); if (down != NULL) { indent(os, depth + 1); os << "begin down from " << node->name_.toText() << "\n"; dumpTreeHelper(os, down, depth + 1); indent(os, depth + 1); os << "end down from " << node->name_.toText() << "\n"; } dumpTreeHelper(os, node->getLeft(), depth + 1); dumpTreeHelper(os, node->getRight(), depth + 1); } template void RBTree::indent(std::ostream& os, unsigned int depth) { static const unsigned int INDENT_FOR_EACH_DEPTH = 5; os << std::string(depth * INDENT_FOR_EACH_DEPTH, ' '); } template void RBTree::dumpDot(std::ostream& os, bool show_pointers) const { int nodecount = 0; os << "digraph g {\n"; os << "node [shape = record,height=.1];\n"; dumpDotHelper(os, root_, &nodecount, show_pointers); os << "}\n"; } template int RBTree::dumpDotHelper(std::ostream& os, const RBNode* node, int* nodecount, bool show_pointers) const { if (node == NULL) { return 0; } int l = dumpDotHelper(os, node->getLeft(), nodecount, show_pointers); int r = dumpDotHelper(os, node->getRight(), nodecount, show_pointers); int d = dumpDotHelper(os, node->getDown(), nodecount, show_pointers); *nodecount += 1; os << "node" << *nodecount << "[label = \" | " << node->name_.toText() << "|"; if (show_pointers) { os << "| n=" << node << "| p=" << node->parent_; } os << "\"] ["; if (node->getColor() == RBNode::RED) { os << "color=red"; } else { os << "color=black"; } if (node->isSubTreeRoot()) { os << ",penwidth=3"; } if (node->isEmpty()) { os << ",style=filled,fillcolor=lightgrey"; } os << "];\n"; if (node->getLeft() != NULL) { os << "\"node" << *nodecount << "\":f0 -> \"node" << l << "\":f1;\n"; } if (node->getDown() != NULL) { os << "\"node" << *nodecount << "\":f1 -> \"node" << d << "\":f1 [penwidth=5];\n"; } if (node->getRight() != NULL) { os << "\"node" << *nodecount << "\":f2 -> \"node" << r << "\":f1;\n"; } return (*nodecount); } } } #endif // _RBTREE_H // Local Variables: // mode: c++ // End: