trie樹查找和hash查找比較（大量數據）

阿新 • • 發佈：2017-07-17

stdlib.h emp lib ras eno strlen oid ack std

trie樹代碼

#include<stdio.h>
#include<stdlib.h>
#include<string.h>
#include<time.h>
#include<fstream>
#include<iostream>
#include<sstream>
#include<string>
#include<vector>
using namespace std;
/**
 * One node of a trie over the lower-case letters 'a'..'z'.
 *
 * A node that terminates an inserted word carries a copy of that word and
 * the number of times it was inserted; every other node has word == NULL.
 */
class trienode
{
public:
    char *word;           // NUL-terminated copy of the word ending here, or NULL
    int count;            // word frequency
    trienode *branch[26]; // child for each letter 'a'..'z'; NULL when absent
public:
    // Value-initializing `branch` sets all 26 child pointers to null without
    // relying on memset (whose second argument is a byte value, not a pointer).
    trienode() : word(NULL), count(0), branch()
    {
    }
};
class trie
{
public:
    trienode *root;
public:
    trie();
    ~trie();
    void Insert(char *str);
    bool Search(char 
*str, int &count);//索引
    void printall(trienode *root);//字符排序
    void printpre(char *str);//前綴匹配
};
trie::trie()
{
    root = new trienode();
}
trie::~trie() {}
void trie::Insert(char *str)
{
    int index;
    trienode *tt = root;
    for (int i = 0; str[i]; i++)
    {
        index = str[i] - ‘a‘;
         
if (index < 0 || index>26)
        {
            return;
        }
        if (tt->branch[index] == NULL)
        {
            tt->branch[index] = new trienode();
        }
        tt = tt->branch[index];
    }
    if (tt->word)
    {
        tt->count++;
        return;
    }
    else
    {
        tt->count++;
        tt->word = new char[strlen(str) + 1];
        strcpy_s(tt->word, strlen(str) + 1, str);
    }

}
bool trie::Search(char *str, int &count)
{
    int index = -1;
    trienode *tt = root;
    while (tt&&*str)
    {
        index = *str - ‘a‘;
        if (index < 0 || index>26) return false;
        tt = tt->branch[index];
        str++;
    }
    if (tt&&tt->word)
    {
        count = tt->count;
        return true;
    }
    return false;
}
// Prints every word stored in the subtree at `root`, one per line.
// A node's own word is printed before its children, and children are
// visited from 'a' to 'z', so the output is in alphabetical order.
// Note: the parameter deliberately shadows the member of the same name.
void trie::printall(trienode *root)
{
    if (root == NULL)
    {
        return;
    }
    if (root->word != NULL)
    {
        std::cout << root->word << std::endl;
    }
    int letter = 0;
    while (letter < 26)
    {
        printall(root->branch[letter]);
        ++letter;
    }
}
void trie::printpre(char *str)
{
    trienode *t = root;
    int index = -1;
    while (t&&*str)
    {
        index = *str - ‘a‘;
        if (index < 0 || index>26) return;
        t = t->branch[index];
        str++;
    }
    if (t)
    {
        printall(t);
    }
}
int main()
{
    clock_t startTime, endTime;
    startTime = clock();
    trie *t = new trie();
    ifstream it("C:/Users/ww/Desktop/string.txt");
    string sline;
    string str = "";
    while (it&&getline(it, sline))
    {
        str += sline + " ";
    }
    it.close();
    for (int i = 0; i < str.length(); i++)
    {
        if (str[i] == ‘.‘ || str[i] == ‘,‘ || str[i] == ‘(‘ || str[i] == ‘(‘)
        {
            str.erase(i, 1);
        }
    }
    string word;
    stringstream ss(str);
    vector<string> vec;
    while (ss >> word)
    {
        vec.push_back(word);
    }
    vector<string>::iterator iter;
    for (iter = vec.begin(); iter != vec.end(); iter++)
    {
        t->Insert((char*)(*iter).data());
    }
    int val = -1;
    if (t->Search("the", val))
    {
        cout << val << endl;
    }
    else
    {
        cout << "empty" << endl;
    }
    endTime = clock();
    cout << "the running time is " << (double)(endTime - startTime) << endl;
    return 0;
}

hash代碼

#include<iostream>
#include<fstream>
#include<sstream>
#include<string>
#include<vector>
#include<stdlib.h>
#include<time.h>
using namespace std;
// Node of a singly linked bucket chain in the hash table.
struct hashnode
{
    char* p;        // the key stored in this node (a C string)
    hashnode* next; // following node in the same bucket, or NULL at the end
};
class hashmap
{
public:
    hashnode *hashps[1000];
public:
    hashmap();
    ~hashmap();
    int String2Int(char *p);
    void Insert(char *p);
    bool Find(char *p);
};
hashmap::hashmap()
{
    for (int i = 0; i < 1000; i++)
    {
        hashps[i] = new hashnode();
    }
    for (int i = 0; i < 1000; i++)
    {
        hashps[i]->next = NULL;
    }
}
hashmap::~hashmap() {}
int hashmap::String2Int(char *p)
{
    int num = 0;
    while (*p)
    {
        num += *p;
        p++;
    }
    return num % 1000;
}
void hashmap::Insert(char *p)
{
    int index = String2Int(p);
    hashnode *hash = hashps[index];
    hashnode *newr = new hashnode();
    newr->p = new char[strlen(p) + 1];
    strcpy_s(newr->p, strlen(p) + 1, p);
    newr->next = hash->next;
    hash->next = newr;
}
bool hashmap::Find(char *p)
{
    int index = String2Int(p);
    hashnode *t = hashps[index]->next;
    if (!t)
    {
        return false;
    }
    else
    {
        hashnode *w = t;
        while (w)
        {
            if (strcmp(p, w->p)==0)
            {
                return true;
            }
            w = w->next;
        }
    }
}
// Returns the int that `p` points to. `p` is dereferenced unconditionally.
int re(int *p)
{
    const int value = p[0];
    return value;
}
int main()
{
    clock_t startTime, endTime;
    startTime = clock();
    hashmap *t = new hashmap();
    ifstream it("C:/Users/ww/Desktop/string.txt");
    string sline;
    string str = "";
    while (it&&getline(it, sline))
    {
        str += sline + " ";
    }
    it.close();
    for (int i = 0; i < str.length(); i++)
    {
        if (str[i] == ‘.‘ || str[i] == ‘,‘ || str[i] == ‘(‘ || str[i] == ‘(‘)
        {
            str.erase(i, 1);
        }
    }
    stringstream ss(str);
    string word;
    vector<string> vec;
    while (ss >> word)
    {
        vec.push_back(word);
    }
    vector<string>::iterator iter;
    for (iter = vec.begin(); iter != vec.end(); iter++)
    {
        t->Insert((char*)(*iter).data());
    }
    cout << "the result is: " << t->Find("the") << endl;
    endTime = clock();
    cout << "the running time is " << (double)(endTime - startTime) << endl;
    return 0;
}

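trie樹查找時間是O(L)，L是字符串長度；hash查找需先用O(L)計算哈希值，再遍歷對應鏈表，為O(L+LL)，LL是關鍵字對應哈希地址的鏈表長度。trie樹的查找時間與數據的大小無關；hash在桶數固定（此處為1000）時，鏈表長度LL會隨數據量增長，只有桶數足夠多、衝突很少時才可視為與數據的大小無關。在這些條件下，兩者查找都很高效。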

trie樹查找和hash查找比較（大量數據）

stdlib.h emp lib ras eno strlen oid ack std trie樹代碼 #include<iostream> #include<stdio.h> #include<iostream> #include&l

AutomaticallyProfile 自動化引擎 MyBatis和DB溝通的引擎（根據數據庫信息自動給生成實體類那些...）

... 數據庫名 ica cmd 信息 images 類名 sources 生成 1.首先建立一個文件夾AutomaticallyProfile 文件夾內有四個jar包：mysql.jar mybat

文件查找和壓縮——Linux基本命令（12）

linux1.文件查找在文件系統上查找符合條件的文件：locate, find非實時查找(數據庫查找)：locate實時查找：find 2.locate（1）功能特點查詢系統上預建的文件索引數據庫/var/lib/mlocate/mlocate.db依賴於事先構建的索引索引的構建是在系統較為空閑時自動進行

順序查找和二分查找代碼

malloc pan maxsize inpu struct keys int ted print /************************************************************************* > Fi

算法-基礎和查找-1.漢諾塔/2.順序查找/3.二分查找/4.順序查找和二分查找的比較

arc none spl opened spa earch 每次 int 順序 1.漢諾塔：　　如下圖所示，需要將A柱子中的所有圓盤按照從小到大的順序移動到C柱子上，並且在移動過程中大圓盤不能在小圓盤上面　　　　分析問題：最終希望呈現的結果是將A柱子上的盤子全部按照從

樹的直徑和並查集判環

#include<iostream> #include<algorithm> #include<cstring> #include<cstdio> #include<queue> #define maxn 2000

（LeetCode 513）找樹左下角的值 [DFS + 找樹左下角的值=葉子節點 + 最左（第一次出現） ]

513. 找樹左下角的值給定一個二叉樹，在樹的最後一行找到最左邊的值。示例 1: 輸入: 2 / \ 1 3 輸出: 1 示例 2: 輸入: 1 / \ 2 3 / / \

Trie樹的構建和應用

Trie樹又叫“字典樹”，是一種在字串計算中極為常見的資料結構。在介紹Trie樹的具體結構之前，我們首先要搞明白的就是Trie樹究竟是用來解決哪一類問題的，為什麼這類問題可以用Trie樹高效的解決。我們為什麼用Trie樹 1. 節約字串的儲存空間

輸入一串字元，只包含“0-10”和“,”，找出其中最小的數字和最大的數字（可能不止一個），輸出最後剩餘數字個數

輸入一串字元，只包含“0-10”和“，”找出其中最小的數字和最大的數字（可能不止一個），輸出最後剩餘數字個數。如：輸入 “3,3,4,5,6,7,7” 輸出 3 支援0-10 #include "stdafx.h" int _tmain(int a

svn報錯“請求的名稱有效但是找不到請求的類型的數據”的解決方案之一

svn 報錯請求　　昨天收到同事的易信，說是svn不能用了。　　由於只有他自己反映無法使用，而且，我使用svn也沒有問題。因此，這事基本應該和服務沒什麽關系。看了一下進程，也沒什麽問題。[[email protected]/* */ svndata]# ps -ef|grep sv

一、查看Linux內核版本命令（兩種方法）：

use proc color tex 2.6 distrib oot lin hat 一、查看Linux內核版本命令（兩種方法）：1、cat /proc/version[[email protected]CentOS home]# cat /proc/versio

轉載：哈夫曼樹的構造和哈夫曼編碼（C++代碼實現）

作者 pos blank 字符 element start man null == 作者：qiqifanqi 原文：http://blog.csdn.net/qiqifanqi/article/details/6038822 #include<stdio.h>

SQL Server 表的管理_關於表的操作增刪查改的操作的詳解（案例代碼）

har table 詳解增刪 .com ble tab SQ eat SQL Server 表的管理_關於表的操作增刪查改的操作的詳解（案例代碼）概述：表由行和列組成，每個表都必須有個表名。 SQL CREATE TABLE 語法 CREATE T

vue打包後出現靜態資源|（圖片，json數據）找不到路徑

CP 解決 png 路徑分享圖片分享 com 奇跡 public 最近在學習Vue是如何編寫項目的，在踩了許多坑後，終於要到了最後一步npm run build了，很開心的等待奇跡，然後打包後出現了找不到圖片路徑的問題。解決辦法：1.將圖片或者json數據文件夾放到s

oracle 表連線方式： nested loop 巢狀迴圈和Hash Join的比較

一、建立兩張實驗用表：wireless_site.merchant和wireless_site.bb SQL> select count(*) from wireless_site.merchant; COUNT(*) ---------- 14005

Eclipse找出所有中文字元方法（全球化開發方式）

Eclipse 中,將專案中的所有中文字元找到,並替換,雖然我們平時開發不用中文，但不能保證一定就沒有中文字元出現。利用eclipse正則查詢 CTRL+H 輸入[^\x00-\xff]包括方括號，並且選中“Regualr expression” 就把所有的中文字元找出來了，很方便吧！

redis數據類型四之hash的指令操作（五種數據類型中最重要的一種）

redis數據類型 hash的指令操作 1、老規矩，看看redis官方文檔怎麽寫: 這裏說呢，hashes 這種數據類型容易代表對象，實際上你可以無限制地在 hash 中放給定數量的字段。（除了可用的內存）（其實這個我理解有些模糊，是內存能夠滿足就可以無限制的放入嗎？）所

樹狀數組的進階運用（Stars 數星星）

p s 計算 right star http 復雜一個 examine maps 英文原題 Problem Description Astronomers often examine star maps where stars are represented by poi

向後端請求數據以及像後端發送數據要求（刪除數據和添加數據）

doc content request 使用 style except 刪除數據庫 cal data 刪除數據和添加數據只能後端操作刪除數據和添加數據都要用到的html（一）部分 <!DOCTYPE html><html lang="en">&

老司機帶你用MaxCompute和表格存儲玩轉車聯網數據

tps 爆發 sqlserve 屬性分庫所有 spa 控制定期原文鏈接 “自動駕駛汽車”在近兩年頻頻出現於各大科技新聞頭條，自2012年谷歌獲得美國首個自動駕駛汽車許可證以來，國外各大知名汽車廠商如奔馳、沃爾沃、大眾、通用、豐田、日產、特斯拉等也紛紛宣布自己的自動駕

trie樹查找和hash查找比較（大量數據）

相關推薦