查找树--RadixTree【基数树】原理图解及示例代码

最新推荐文章于 2024-08-26 02:44:41 发布

enjoy编程

最新推荐文章于 2024-08-26 02:44:41 发布

阅读量5.2k

点赞数 5

分类专栏：算法　文章标签：基数树 RadixTree Trie 原理 源码 示例

本文链接：https://blog.csdn.net/penriver/article/details/121082106

版权

算法专栏收录该内容

29 篇文章 6 订阅

订阅专栏

基数树

概念

RadixTree：基数树，或称压缩前缀树，是一种更节省空间的Trie。

基数树是Trie的压缩版本【compact version】。
在空间利用上更有效
- Trie因为通常在一条边中只存储1个字符，所以空间利用效率低下。
- 基数树针对这一点做了优化：在一条边中存储多个字符（即一段文本字符串），从而减少所需的额外边和节点的数量，同时仍然保持与Trie相同的表示意义和性能。
在最坏的情况下一个基数树将是一个Trie。

基数树示例如下：
在这里插入图片描述

树操作

插入过程

注意：如果插入的字符串和已有的某条边有共同的前缀，则需要把这段共同前缀提取出来单独作为一条边，并把两者各自不同的剩余部分作为新增节点的2条边

每个节点都可以有边，并且有一个标志来表明它是否是一个单词的结束。
每条边都有一串字符和它通向的一个节点

查找

查找示例如下：
在这里插入图片描述

删除

惰性删除：即沿着路径查找到叶节点后，直接删除叶节点，中间的非叶节点不删除
非惰性删除：将删除后只有一条边的顶点向上合并
详见代码实现

源码示例

import java.util.HashMap;
/**
 * Demo driver for {@link RadixTree}: loads a fixed set of words, then shows the
 * result of a lookup and the stored words before and after one deletion.
 */
class RadixTreeTest {
    public static void main(String[] args) {
        // Insertion order is kept exactly as listed.
        String[] sampleWords = {
            "test", "water", "slow", "slower", "team", "tester", "t", "toast"
        };

        RadixTree radix = new RadixTree();
        for (String sample : sampleWords) {
            radix.insert(sample);
        }

        // "te" is a shared prefix of several inserted words but is never inserted itself.
        report(radix, "te");

        radix.delete("test");

        report(radix, "te");
    }

    /** Prints whether {@code probe} is stored, followed by every word in the tree. */
    private static void report(RadixTree radix, String probe) {
        boolean found = radix.search(probe);
        System.out.println(found);
        radix.printAllWords();
    }
}

/**
 * A radix tree (compressed prefix tree) storing a set of strings.
 *
 * <p>Each node owns a map from the first character of an edge label to that edge;
 * each edge carries a non-empty label and the node it leads to. A node whose
 * {@code isLeaf} flag is set marks the end of a stored word (the flag name is
 * historical: such a node may still have outgoing edges).
 *
 * <p>The empty string is a valid word and is represented by the flag on the root.
 */
public class RadixTree {
    /** Sentinel returned when two strings agree on their whole common length. */
    private static final int NO_MISMATCH = -1;

    /** Root node; never replaced, only mutated. */
    private final Node root;

    /** Creates an empty tree. */
    public RadixTree() {
        root = new Node(false);
    }

    /**
     * Adds {@code word} to the tree. Inserting a word that is already present
     * leaves the tree unchanged.
     *
     * @param word the word to store; may be empty
     * @throws NullPointerException if {@code word} is {@code null}
     */
    public void insert(String word) {
        // The loop below never runs for "", so the empty word is recorded on the root directly.
        if (word.isEmpty()) {
            root.isLeaf = true;
            return;
        }

        Node current = root;
        int currIndex = 0;

        while (currIndex < word.length()) {
            char transitionChar = word.charAt(currIndex);
            Edge currentEdge = current.getTransition(transitionChar);
            // Part of the word that still has to be placed below `current`.
            String currStr = word.substring(currIndex);

            // No edge starts with this character: hang the whole remainder here and finish.
            if (currentEdge == null) {
                current.edges.put(transitionChar, new Edge(currStr));
                break;
            }

            int splitIndex = getFirstMismatchLetter(currStr, currentEdge.label);
            if (splitIndex == NO_MISMATCH) {
                if (currStr.length() == currentEdge.label.length()) {
                    // Remainder equals the edge label: just mark the target as a word.
                    currentEdge.next.isLeaf = true;
                    break;
                } else if (currStr.length() < currentEdge.label.length()) {
                    // Remainder is a proper prefix of the label: cut the edge and
                    // insert a word node between the two halves.
                    String suffix = currentEdge.label.substring(currStr.length());
                    currentEdge.label = currStr;
                    Node newNext = new Node(true);
                    Node afterNewNext = currentEdge.next;
                    currentEdge.next = newNext;
                    newNext.addEdge(suffix, afterNewNext);
                    break;
                } else {
                    // Label is a proper prefix of the remainder: consume it and descend.
                    splitIndex = currentEdge.label.length();
                }
            } else {
                // Label and remainder diverge at splitIndex: keep the common prefix on
                // this edge and push the old tail below a new non-word node. The next
                // iteration attaches the rest of the word as a sibling of that tail.
                String suffix = currentEdge.label.substring(splitIndex);
                currentEdge.label = currentEdge.label.substring(0, splitIndex);
                Node prevNext = currentEdge.next;
                currentEdge.next = new Node(false);
                currentEdge.next.addEdge(suffix, prevNext);
            }

            current = currentEdge.next;
            currIndex += splitIndex;
        }
    }

    /**
     * Reports whether {@code word} was inserted as a complete word; a mere prefix
     * of stored words does not count.
     *
     * @param word the word to look up
     * @return {@code true} if the word is stored, {@code false} otherwise
     * @throws NullPointerException if {@code word} is {@code null}
     */
    public boolean search(String word) {
        Node current = root;
        int currIndex = 0;
        while (currIndex < word.length()) {
            char transitionChar = word.charAt(currIndex);
            Edge edge = current.getTransition(transitionChar);
            if (edge == null) {
                return false;
            }

            // The whole edge label must be matched; stopping mid-edge is a miss.
            String currSubstring = word.substring(currIndex);
            if (!currSubstring.startsWith(edge.label)) {
                return false;
            }
            currIndex += edge.label.length();
            current = edge.next;
        }

        return current.isLeaf;
    }

    /**
     * Removes {@code word} from the tree if its path exists, merging nodes that
     * are left with a single outgoing edge and no word flag into their parent edge.
     *
     * @param word the word to remove
     * @throws NullPointerException if {@code word} is {@code null}
     */
    public void delete(String word) {
        // The recursive helper always hands the root back for the root call,
        // so its return value does not need to be stored.
        delete(root, word);
    }

    /**
     * Recursive removal step.
     *
     * @param current node reached so far
     * @param word    part of the word still to be matched below {@code current}
     * @return {@code current}, or {@code null} when {@code current} should be
     *         detached from its parent
     */
    private Node delete(Node current, String word) {
        // Everything matched: `current` is the node that would carry the word flag.
        if (word.isEmpty()) {
            // A childless non-root node has no remaining purpose; ask the parent to drop it.
            if (current.edges.isEmpty() && current != root) {
                return null;
            }
            current.isLeaf = false;
            return current;
        }

        char transitionChar = word.charAt(0);
        Edge edge = current.getTransition(transitionChar);
        // No matching edge, or the word ends or diverges inside the label: nothing to remove.
        if (edge == null || !word.startsWith(edge.label)) {
            return current;
        }

        Node deleted = delete(edge.next, word.substring(edge.label.length()));
        if (deleted == null) {
            current.edges.remove(transitionChar);
            if (current.totalEdges() == 0 && !current.isLeaf && current != root) {
                return null;
            }
        } else if (deleted.totalEdges() == 1 && !deleted.isLeaf) {
            // Child is now a pass-through node: splice its only edge onto ours.
            current.edges.remove(transitionChar);
            for (Edge afterDeleted : deleted.edges.values()) {
                current.addEdge(edge.label + afterDeleted.label, afterDeleted.next);
            }
        }
        return current;
    }

    /**
     * Finds the first position at which the two strings differ.
     *
     * @param word     remainder of the word being inserted
     * @param edgeWord label of the edge being compared
     * @return index of the first differing character within the shorter length,
     *         or {@link #NO_MISMATCH} if none differs there
     */
    private int getFirstMismatchLetter(String word, String edgeWord) {
        int commonLength = Math.min(word.length(), edgeWord.length());
        // insert() only calls this for an edge looked up by word's first character,
        // so index 0 always matches there; scanning from 0 keeps the helper
        // correct without depending on that.
        for (int i = 0; i < commonLength; i++) {
            if (word.charAt(i) != edgeWord.charAt(i)) {
                return i;
            }
        }
        return NO_MISMATCH;
    }

    /**
     * Prints every stored word to standard output, each followed by a comma and
     * with no trailing newline. Order follows the iteration order of the
     * per-node hash maps.
     */
    public void printAllWords() {
        printAllWords(root, "");
    }

    /**
     * Depth-first print of the words below {@code current}.
     *
     * @param current node being visited
     * @param result  concatenation of the edge labels from the root to {@code current}
     */
    private void printAllWords(Node current, String result) {
        if (current.isLeaf) {
            System.out.print(result + ",");
        }

        for (Edge edge : current.edges.values()) {
            printAllWords(edge.next, result + edge.label);
        }
    }

    /** Tree node: a word-end flag plus outgoing edges keyed by their label's first character. */
    private static final class Node {
        /** True when the path from the root to this node spells a stored word. */
        private boolean isLeaf;
        private final HashMap<Character, Edge> edges;

        Node(boolean isLeaf) {
            this.isLeaf = isLeaf;
            edges = new HashMap<>();
        }

        /** Returns the edge whose label starts with {@code transitionChar}, or {@code null}. */
        Edge getTransition(char transitionChar) {
            return edges.get(transitionChar);
        }

        /** Adds (or replaces) the edge keyed by the first character of {@code label}. */
        void addEdge(String label, Node next) {
            edges.put(label.charAt(0), new Edge(label, next));
        }

        int totalEdges() {
            return edges.size();
        }
    }

    /** Labelled edge leading to a child node; both parts are rewritten when edges are split. */
    private static final class Edge {
        private String label;
        private Node next;

        /** Creates an edge leading to a fresh word node. */
        Edge(String label) {
            this(label, new Node(true));
        }

        Edge(String label, Node next) {
            this.label = label;
            this.next = next;
        }
    }
}