我有500w個單詞，你幫忙設計一個數據結構來進行儲存，存好之後，我有兩個需求。（程式人生程式碼copy）

阿新 • • 發佈：2018-12-15

1、來了一個新的單詞，需要判斷是否在這500w個單詞中

2、來了一個單詞字首，給出500w個單詞中有多少個單詞以該字首開頭

package cango.scf.common.util;

import java.util.HashMap;
import java.util.Map;

/**
 * Compressed prefix tree (radix tree) holding a set of distinct words.
 *
 * <p>Each node stores a fragment of one or more characters; concatenating the
 * fragments on the path from the root to a node yields a prefix shared by every
 * word stored beneath that node. Two children of the same node never start with
 * the same character, so at most one child can continue any given string.
 *
 * <p>Supported queries:
 * <ul>
 *   <li>{@link #find(String)} - is the exact word stored?</li>
 *   <li>{@link #count(String)} - how many distinct stored words start with a prefix?</li>
 * </ul>
 *
 * <p>Words are treated as a set: adding a word that is already stored changes
 * nothing. {@code null} and empty strings are never stored. The class performs no
 * synchronization.
 */
public class DictionaryTree {

    /** A node of the tree. */
    private static final class Node {
        /** True when the path from the root down to this node spells a stored word. */
        private boolean isWord;
        /** Number of stored words in the subtree rooted here (this node included). */
        private int count;
        /** Fragment carried by this node; {@code null} only for the root. */
        private String str;
        /** Children, keyed by each child's own fragment. */
        private final Map<String, Node> childs = new HashMap<String, Node>();
        /** Parent node; {@code null} only for the root. */
        private Node parent;

        Node() {
        }

        Node(boolean isWord, int count, String str) {
            this.isWord = isWord;
            this.count = count;
            this.str = str;
        }

        /** Registers {@code node} as a child under {@code key} and points it back at this node. */
        void addChild(String key, Node node) {
            childs.put(key, node);
            node.parent = this;
        }

        /** Unregisters the child stored under {@code key}, if any. */
        void removeChild(String key) {
            childs.remove(key);
        }

        @Override
        public String toString() {
            return "str : " + str + ", isWord : " + isWord + ", count : " + count;
        }
    }

    /** Root of the tree; it carries no fragment. */
    private final Node root;

    /** Creates an empty tree. */
    public DictionaryTree() {
        root = new Node();
    }

    /** Returns the length of the longest common prefix of {@code a} and {@code b}. */
    private static int commonPrefixLength(String a, String b) {
        int limit = Math.min(a.length(), b.length());
        int i = 0;
        while (i < limit && a.charAt(i) == b.charAt(i)) {
            i++;
        }
        return i;
    }

    /**
     * Inserts {@code word} into the subtree rooted at {@code node}.
     *
     * <p>The caller must guarantee that {@code word} is non-empty, is not already
     * stored, and (for a non-root node) shares its first character with the node's
     * fragment; {@link #add(String)} and {@link #searchChild(String, Node)} establish
     * these conditions.
     *
     * @param word the part of the word that has not been consumed by ancestors
     * @param node the node to insert into
     */
    private void addStr(String word, Node node) {
        // One more word will live in this subtree.
        node.count++;

        String str = node.str;
        if (str == null) {
            // Root: it has no fragment, so go straight to the children.
            searchChild(word, node);
            return;
        }

        int commonLen = commonPrefixLength(word, str);

        if (commonLen == str.length()) {
            if (commonLen == word.length()) {
                // The word ends exactly on this node. The node may so far only have
                // been an inner split point, so it must be flagged as a word now.
                node.isWord = true;
            } else {
                // The node's fragment is fully consumed; continue with the remainder.
                searchChild(word.substring(commonLen), node);
            }
            return;
        }

        // Only part of the node's fragment matches: split the node at the common prefix.
        String commonPrefix = str.substring(0, commonLen);
        boolean wordEndsAtSplit = commonLen == word.length();
        // node.count already includes the new word, which also lives below the split node.
        Node splitNode = new Node(wordEndsAtSplit, node.count, commonPrefix);
        Node parent = node.parent;
        parent.addChild(commonPrefix, splitNode);
        parent.removeChild(str);

        // The old node keeps only its own words and the unmatched tail of its fragment.
        node.count--;
        String strLeft = str.substring(commonLen);
        node.str = strLeft;
        splitNode.addChild(strLeft, node);

        // Whatever is left of the new word becomes a sibling leaf of the old node.
        if (!wordEndsAtSplit) {
            String wordLeft = word.substring(commonLen);
            splitNode.addChild(wordLeft, new Node(true, 1, wordLeft));
        }
    }

    /**
     * Inserts {@code wordLeft} below {@code node}: descends into the child whose
     * fragment starts with the same character, or creates a new leaf when no such
     * child exists.
     *
     * @param wordLeft the non-empty remainder of the word being inserted
     * @param node     the node whose children are examined
     */
    public void searchChild(String wordLeft, Node node) {
        char first = wordLeft.charAt(0);
        for (Node child : node.childs.values()) {
            if (child.str.charAt(0) == first) {
                // addStr may restructure node.childs, so stop iterating immediately.
                addStr(wordLeft, child);
                return;
            }
        }
        node.addChild(wordLeft, new Node(true, 1, wordLeft));
    }

    /**
     * Adds a word to the dictionary.
     *
     * <p>{@code null} and empty strings are ignored, and so is a word that is
     * already stored, so prefix counts always reflect distinct words.
     *
     * @param word the word to add
     */
    public void add(String word) {
        if (word == null || word.isEmpty() || find(word)) {
            return;
        }
        addStr(word, root);
    }

    /**
     * Looks for {@code word} in the subtree rooted at {@code node}.
     *
     * @param word the part of the word that has not been consumed by ancestors
     * @param node the node to match against
     * @return true when the word ends on a node flagged as a word
     */
    private boolean findStr(String word, Node node) {
        String wordLeft = word;
        String str = node.str;
        if (str != null) {
            if (!word.startsWith(str)) {
                return false;
            }
            wordLeft = word.substring(str.length());
        }
        if (wordLeft.isEmpty()) {
            // Fully matched: the answer is whether this node marks a word.
            return node.isWord;
        }
        // At most one child can start with the next character.
        char next = wordLeft.charAt(0);
        for (Node child : node.childs.values()) {
            if (child.str.charAt(0) == next) {
                return findStr(wordLeft, child);
            }
        }
        return false;
    }

    /**
     * Tells whether a word is stored in the dictionary.
     *
     * @param word the word to look up; {@code null} is never found
     * @return true when exactly this word has been added
     */
    public boolean find(String word) {
        return word != null && findStr(word, root);
    }

    /**
     * Counts the words matching {@code prefix} among the children of {@code node}.
     *
     * @param prefix the non-empty remainder of the prefix
     * @param node   the node whose children are examined
     * @return the number of matching words, or 0 when no child continues the prefix
     */
    private int countChildStr(String prefix, Node node) {
        char first = prefix.charAt(0);
        for (Node child : node.childs.values()) {
            if (child.str.charAt(0) == first) {
                return countStr(prefix, child);
            }
        }
        return 0;
    }

    /**
     * Counts the words in the subtree rooted at {@code node} that match {@code prefix}.
     *
     * @param prefix the non-empty remainder of the prefix
     * @param node   the node to match against
     * @return the number of matching words
     */
    private int countStr(String prefix, Node node) {
        String str = node.str;
        if (str == null) {
            // Root: delegate to the children.
            return countChildStr(prefix, node);
        }
        if (str.startsWith(prefix)) {
            // The prefix ends inside (or exactly at) this fragment: the whole subtree matches.
            return node.count;
        }
        if (prefix.startsWith(str)) {
            // The fragment is consumed; match the rest of the prefix further down.
            return countChildStr(prefix.substring(str.length()), node);
        }
        return 0;
    }

    /**
     * Counts the stored words that start with {@code prefix}.
     *
     * @param prefix the prefix to look for; {@code null} or a blank string matches every word
     * @return the number of distinct stored words starting with the prefix
     */
    public int count(String prefix) {
        if (prefix == null || prefix.trim().isEmpty()) {
            return root.count;
        }
        return countStr(prefix, root);
    }

    /** Prints {@code node} indented by {@code layer} tabs, followed by its subtree. */
    private void printNode(Node node, int layer) {
        for (int i = 0; i < layer; i++) {
            System.out.print("\t");
        }
        System.out.println(node);
        for (Node child : node.childs.values()) {
            printNode(child, layer + 1);
        }
    }

    /** Prints the whole tree to standard output, one node per line. */
    public void print() {
        printNode(root, 0);
    }

}

package cango.scf.common.util;

/** Small demo driver for {@code DictionaryTree}. */
public class DictionaryTreeMain {

    /**
     * Fills a tree with a few sample words (one of them twice), dumps the tree,
     * then runs one exact lookup and one prefix count and prints both results.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        String[] samples = {
            "interest", "interesting", "interested", "inside",
            "insert", "apple", "inter", "interesting"
        };

        DictionaryTree tree = new DictionaryTree();
        for (String sample : samples) {
            tree.add(sample);
        }
        tree.print();

        System.out.println("find inside : " + tree.find("inside"));
        System.out.println("count prefix inter : " + tree.count("inter"));
    }
}

我有500w個單詞，你幫忙設計一個數據結構來進行儲存，存好之後，我有兩個需求。（程式人生程式碼copy）

1、來了一個新的單詞，需要判斷是否在這500w個單詞中 2、來了一個單詞字首，給出500w個單詞中有多少個單詞是該字首 package cango.scf.common.util; import java.util.HashMap; import java.util.

如果系統要使用超大整數（超過long長度範圍），請你設計一個數據結構來儲存這種超大型數字以及設計一種演算法來實現超大整數加法運算）

/** * 超大整數相加： * 題目要求：如果系統要使用超大整數（超過long的範圍），請你設計一個數據結構來儲存這種 * 超大型數字以及設計一種演算法來實現超大整數的加法運算 * @author Administrator * */ p

統計一個數據庫內所有表的記錄條數總和，統計一個數據庫中有多少張表的SQL語句

--統計一個數據庫內所有表的記錄條數總和select SUM(rowcounts)from (SELECT OBJECT_NAME(id) AS [TBName],MAX(rowcnt)[rowcounts] FROM sys.sysindexes GROUP B

操作系統-文件目錄（又發現一個數據結構）

spa 文件目錄 height 數據結構 png 操作系統 src title 技術分享另外一種回答 ——————————————————- 操作系統-文件目錄（又發現一個數據結構）

Django：Error: [WinError 10013] 以一種訪問許可權不允許的方式做了一個訪問套接字的嘗試。（殺佔用埠程序）

Error: [WinError 10013] 以一種訪問許可權不允許的方式做了一個訪問套接字的嘗試。 1.啟動伺服器的時候提示埠被佔用，Error: [WinError 10013] 以一種訪問許可權不允許的方式做了一個訪問套接字的嘗試。解決方案 1.查找出被佔用的

為什麼說，隨波逐流是成為一個數據科學英雄最大的阻礙

如果你集齊演算法，業務，計算機知識這三顆龍珠，那麼你就可以召喚一個小一點兒的“神龍”了。但是想要召喚全能“神龍”，除了技術過硬之外，你還需要過硬的獨立思考能力和洞察力。我們如何才能才能擁有獨立思考能力呢？不隨波逐流！有著豐富的資

每天一個數據結構----佇列的順序儲存結構實現（純程式碼）

每天一個數據結構----棧的鏈式儲存結構實現（純程式碼）

每天一個數據結構-----線性表的鏈式（單鏈表）儲存結構

uefi bios pei 階段最重要的一個數據結構（結構體）

在PEI階段，全域性變數大概有這麼幾個： gPs PEI Service 結構的實現，包括所有的PEI 服務的函式指標。比如學見的PeiInstallPPi, PeiCreateHob, PeiSetSystem. 其次就是PrivateData，這個是今天我們要討論

https是如何加密的（知道了原理之後，希望自己能用程式碼實現一下，還有用於對個人資訊和公鑰進行加密的雜湊演算法，有時間也去查一下）

由於http協議是明文傳輸資料，資料的安全性沒有保障。為了改進這種明文傳輸協議，https誕生了。 https是在應用層和傳輸層之間，增加了一層ssl加密。對於加密，請往下看： 1、對稱加密每次在傳送資料之前，伺服器先生成一把金鑰，

買什麼資料結構與演算法，這裡有：動態圖解十大經典排序演算法（含JAVA程式碼實現）

上篇的動圖資料結構反響不錯，這次來個動圖排序演算法大全。資料結構與演算法，齊了。幾張動態圖捋清Java常用資料結構及其設計原理本文將採取動態圖+文字描述+正確的java程式碼實現來講解以下十大排序演算法：氣泡排序選擇排序插入排序希爾排序

codeforces 1058 D. Vasya and Triangle（已知面積求整數點座標，規律，利用__gcd把一個數拆成有範圍限制的兩個數相乘）

題意：給出橫座標最大值n，縱座標最大值m，再給出一個k要求，輸出三個整數點座標構成的三角形的面積為m*n/k 思路： (ps:利用__gcd把一個數拆成有範圍限制的兩個數相乘，不是對這個數的質因數貪心得去乘，湊那兩個範圍(這樣不行的) ) 令x1=y1=0 ，顯然

有n個人圍成一圈，從第1個人開始，1、2、3報數，報至3出局，餘下的人繼續從1、2、3報數，問：最後剩下的一人是原來的第幾號？同時求出被淘汰編號的序列。（要求：用迴圈佇列解決該問題。）

han.h: #include <iostream> #include <stdlib.h> #include "Status.h" using namespace std; typedef struct QNode {ElemType data;struct QNode *next;

雜湊變形—點陣圖（給定40億個不重複的無符號數整數，沒排過序，給一個無符號整數，如何快速判斷一個數是否在這40億個數中）

#include<stdio.h> #include<stdlib.h> #include<assert.h> #include<string.h> typedef struct BitMap { size_t* _bits

“1到10萬這些數，去除2個並打亂次序，如何找出那兩個數。（不準用點陣圖）”...

#include <algorithm> #include <iostream> #include <vector> #include <ctime> using namespace std; void shuffle(vect

給一個字串，有大小寫字母，要求寫一個函式把小寫字母放在前面大寫字母放在後面，儘量使用最小空間，時間複雜度。（即用指標做）。如：aAbBcCdD ---àabcdABCD

#include <stdlib.h> int SmallToCaptial( char *str, char *outbuf ) {char *p = str;if (str == NULL || outbuf == NULL){return -1;}while (*p){if (*p >

當你學會抄菜的時候，你就學會了大數據

抽油煙機鍋碗瓢盆大冬瓜豆腐塊宜家最近在學習數倉跟BI，突然發現，結合自己所學會抄的菜。試著把學過的大數據重新理解一番，希望各位都能來一起討論，共同進步。走進廚房走進廚房後，相信大家會看到各種鍋碗瓢盆，案板，切菜刀，調料，櫥櫃，水池...........而這些就相當於是大數

四種人“cai”在兄弟連戰狼班Java培訓，你屬於哪一種?

心態而且心理一點四種熱血沒有喜歡這樣的四種人“cai”在兄弟連戰狼班Java培訓，你屬於哪一種? 大家好，俺叫劉小財，這個名字的是父母起的，俺覺得父母是這個意思，無論做什麽要給自己留一個後路。俺來到兄弟連二個月，也慢慢適應了這裏的生活，每天都過

php 通過curl獲取遠程數據，返回的是一個數組型的字符串，高手幫忙如何將這個數組類型的字符串變成數組。

bsp 選項 con 獲取 pan 如果 clas exe transfer 如 Array([0] => Array([0] => Array([kd_status] => 已簽收[kd_time] => 2014-04-30 18:59:43 [

我有500w個單詞，你幫忙設計一個數據結構來進行儲存，存好之後，我有兩個需求。（程式人生程式碼copy）

相關推薦