JS高级-数据结构的封装

2022-02-10 04:01:37

最近看了《数据结构与算法JavaScript描述》这本书，对大学里学的数据结构做了一次复习（其实差不多忘干净了，哈哈）。如果能将这些知识捡起来，融入到实际工作当中，估计编码水平将会有一次质的飞跃。带着这个美好的愿望，开始学习吧O(∩_∩)O~~

我们知道在JS中，常常用来组织数据的无非是数组和对象（这些基础就不介绍了）。但在数据结构中，还有一些抽象的数据类型：列表、栈、队列、链表、字典、散列、集合、二叉树、图等，可以用来更好的对实际场景建模。当然这些数据类型，原生JS不支持，那么就需要通过封装来模拟，其底层还是数组和对象（被看穿喽~），接下来我们挨个来解析吧

一、列表

定义：列表是一组有序的数据，每个列表中的数据项称为元素。元素可以是任意数据类型，也不事先限定元素个数。

生活中经常使用到列表，如通讯录、购物车、十佳榜单等。当不需要在一个很长的序列中查找元素或对其排序时，可以使用列表。

列表的封装代码：

/**
 * List: an ordered collection backed by an array, with a movable cursor
 * ("current position") used by front/end/prev/next/moveTo/getElement.
 */
function List() {
    this._dataStore = []; // backing array, elements kept in insertion order
    this._pos = 0;        // cursor: index of the current element
}

List.prototype = {
    constructor: List,

    /** Removes every element and moves the cursor back to the front. */
    clear: function () {
        // Assigning a fresh array is sufficient; deleting the property first adds nothing.
        this._dataStore = [];
        this._pos = 0;
    },

    /**
     * Looks up the first element strictly equal (===) to `element`.
     * @param {*} element value to search for
     * @returns {number} its index, or -1 when absent
     */
    find: function (element) {
        return this._dataStore.indexOf(element);
    },

    /**
     * Tells whether `element` is in the list (same matching rule as find).
     * @param {*} element value to search for
     * @returns {boolean}
     */
    contains: function (element) {
        return this.find(element) > -1;
    },

    /**
     * Inserts `element` immediately after the first occurrence of `after`.
     * @param {*} element value to insert
     * @param {*} after existing element used as the anchor
     * @returns {boolean} true when inserted, false when `after` is not in the list
     */
    insert: function (element, after) {
        var anchor = this.find(after);
        if (anchor === -1) {
            return false;
        }
        this._dataStore.splice(anchor + 1, 0, element);
        return true;
    },

    /** Appends `element` at the end of the list. */
    append: function (element) {
        this._dataStore.push(element);
    },

    /**
     * Removes the first occurrence of `element`. The cursor is left untouched.
     * @param {*} element value to remove
     * @returns {boolean} true when something was removed
     */
    remove: function (element) {
        var foundAt = this.find(element);
        if (foundAt === -1) {
            return false;
        }
        this._dataStore.splice(foundAt, 1);
        return true;
    },

    /** Moves the cursor to the first element. */
    front: function () {
        this._pos = 0;
    },

    /** Moves the cursor to the last element (stays at 0 when the list is empty). */
    end: function () {
        // Clamp at 0: without it an empty list would leave the cursor at -1.
        this._pos = Math.max(0, this._dataStore.length - 1);
    },

    /** Moves the cursor one step towards the front; no-op at the first element. */
    prev: function () {
        if (this._pos > 0) {
            --this._pos;
        }
    },

    /** Moves the cursor one step towards the end; no-op at the last element. */
    next: function () {
        if (this._pos < this._dataStore.length - 1) {
            ++this._pos;
        }
    },

    /**
     * Sets the cursor to `_position`. No bounds checking is performed.
     * @param {number} _position target index
     */
    moveTo: function (_position) {
        this._pos = _position;
    },

    /** @returns {number} the number of elements in the list */
    length: function () {
        return this._dataStore.length;
    },

    /** @returns {number} the current cursor index */
    curr_pos: function () {
        return this._pos;
    },

    /** @returns {*} the element under the cursor (undefined when out of range) */
    getElement: function () {
        return this._dataStore[this._pos];
    },

    /**
     * Despite the name, returns the backing array itself (not a copy and not a
     * string); string concatenation on the result yields a comma-separated text.
     * @returns {Array}
     */
    toString: function () {
        return this._dataStore;
    }
};

列表与数组比较类似，只是简单的对数组做了二次封装，用案例来展示一下列表的使用场景，进一步加深理解。

案例：影碟租赁自助查询系统

// Sample data: the titles the rental kiosk starts with.
var moviearr = [
    '肖申克的救赎', '教父', '教父 2', '低俗小说', '黄金三镖客',
    '十二怒汉', '辛德勒名单', '黑暗骑士', '指环王：王者归来', '搏击俱乐部',
    '星球大战5：帝国反击战', '飞越疯人院', '指环王：护戒使者', '盗梦空间', '好家伙',
    '星球大战', '七武士', '黑客帝国', '阿甘正传', '上帝之城'
];

// Inventory of movies still available, seeded with every title above.
var movieList = new List();
moviearr.forEach(function (title) {
    movieList.append(title);
});

// Rental records; starts out empty.
var customerList = new List();

/**
 * Rental record: which customer currently holds which movie.
 * @param {string} name customer name
 * @param {string} movie title that was checked out
 */
function Customer(name, movie) {
    this.name = name;   // who rented
    this.movie = movie; // what was rented
}

/**
 * Handles one rental request and keeps both lists in sync.
 *
 * When `movie` is in `movieList`, a Customer record is appended to
 * `customerList` and the title is removed from `movieList`; otherwise a
 * "not available" message is logged. Either way the state of both lists is
 * logged afterwards.
 *
 * @param {string} name customer name
 * @param {string} movie requested title
 * @param {object} movieList list offering contains/remove/toString
 * @param {object} customerList list offering append/toString
 */
function checkOut(name, movie, movieList, customerList) {
    var inStock = movieList.contains(movie);
    if (!inStock) {
        console.log(movie + " is not available.");
    } else {
        customerList.append(new Customer(name, movie));
        movieList.remove(movie);
    }

    // Report both lists after the request has been processed.
    var report = [
        'movieList:' + movieList.toString(),
        ' customerList:' + JSON.stringify(customerList.toString())
    ].join('\n');
    console.log(report);
}

// Replay a few rental requests; the last one asks for a title that was
// already rented by the first request.
var rentalRequests = [
    ['gavin', '黑客帝国'],
    ['gavin', '星球大战'],
    ['zoe', '辛德勒名单'],
    ['gulei', '黑客帝国']
];
rentalRequests.forEach(function (request) {
    checkOut(request[0], request[1], movieList, customerList);
});

二、栈

定义：栈是一种特殊的列表，栈内的元素只能通过列表的一端访问，这一端称为栈顶。

栈是一种后入先出（ LIFO， last-in-first-out）的数据结构，任何不在栈顶的元素都无法访问。为了得到栈底的元素，必须先拿掉上面的元素。生活中常见的例子如：餐厅的一摞盘子，只能从上面逐个取，洗净的盘子也只能摞在最上面。

栈的封装代码：

/**
 * Stack: last-in-first-out collection backed by an array.
 */
function Stack() {
    this._dataStore = []; // backing array
    this._top = 0;        // index of the next free slot == number of elements
}

Stack.prototype = {
    constructor: Stack,

    /** Removes every element. */
    clear: function () {
        this._dataStore = [];
        this._top = 0;
    },

    /**
     * Puts `element` on top of the stack.
     * @param {*} element value to store
     */
    push: function (element) {
        this._dataStore[this._top++] = element;
    },

    /**
     * Removes and returns the top element.
     * @returns {*} the removed element, or undefined when the stack is empty
     */
    pop: function () {
        // Guard: decrementing below 0 would make length() negative and let the
        // next push write to index -1.
        if (this._top === 0) {
            return undefined;
        }
        var element = this._dataStore[--this._top];
        this._dataStore.length = this._top; // release the slot held by the popped value
        return element;
    },

    /** @returns {*} the top element without removing it (undefined when empty) */
    peek: function () {
        return this._dataStore[this._top - 1];
    },

    /** @returns {number} the number of elements on the stack */
    length: function () {
        return this._top;
    }
};

相对列表来说，栈的方法不多显得很简洁，同样来几个案例，帮助理解栈的使用场景

案例一：回文

/**
 * Checks whether `word` reads the same forwards and backwards by pushing its
 * characters onto a Stack and popping them off again in reverse order.
 * @param {string} word text to test
 * @returns {boolean} true when the reversed text equals `word`
 */
function isPalindrome(word) {
    var letters = new Stack();
    var idx = 0;
    while (idx < word.length) {
        letters.push(word[idx]);
        idx += 1;
    }

    // Popping yields the characters last-to-first, i.e. the reversed word.
    var reversed = "";
    while (letters.length() > 0) {
        reversed += letters.pop();
    }

    return word == reversed;
}

// Demo: "hello" is not a palindrome, "racecar" is.
var palindromeSamples = ["hello", "racecar"];
palindromeSamples.forEach(function (sample) {
    console.log(isPalindrome(sample)); // false, then true
});

案例二：递归演示

/**
 * Recursive factorial: n! = n * (n-1) * ... * 1, with 0! = 1.
 * @param {number} n non-negative integer
 * @returns {number} n!
 * @throws {RangeError} when n is negative or not an integer; such inputs never
 *     reach the base case and would otherwise recurse until the stack overflows
 */
function factorial(n) {
    var value = Number(n);
    if (!Number.isInteger(value) || value < 0) {
        throw new RangeError("factorial is only defined for non-negative integers, got: " + n);
    }
    return value === 0 ? 1 : value * factorial(value - 1);
}

/**
 * Factorial computed without recursion: the factors n, n-1, ..., 2 are pushed
 * onto a Stack and then multiplied together as they are popped off.
 * @param {number} n upper factor
 * @returns {number} the product of all pushed factors (1 when n <= 1)
 */
function fact(n) {
    var pending = new Stack();
    for (var factor = n; factor > 1;) {
        pending.push(factor--);
    }

    var result = 1;
    while (pending.length() > 0) {
        result = result * pending.pop();
    }
    return result;
}

// Demo: run the recursive and the stack-based implementation on the same input.
var factorialImpls = [factorial, fact];
factorialImpls.forEach(function (impl) {
    console.log(impl(5));
});

三、队列

定义：队列也是一种特殊的列表，不同的是队列只能在队尾插入元素，在队首删除元素。

队列是一种先进先出（First-In-First-Out，FIFO）的数据结构。排在前面的优先处理，后面的依次排队，直到轮到它。生活中常见的例子如：打印任务池、柜台前排队的顾客等。

队列的封装代码：

/**
 * Queue: first-in-first-out collection backed by an array. Elements enter at
 * the back and leave from the front.
 */
function Queue() {
    this._dataStore = []; // backing array; index 0 is the front of the queue
}

Queue.prototype = {
    constructor: Queue,

    /** Removes every element. */
    clear: function () {
        // A queue has no `_top`; only the backing array needs resetting.
        this._dataStore = [];
    },

    /**
     * Adds `element` at the back of the queue.
     * @param {*} element value to store
     */
    enqueue: function (element) {
        this._dataStore.push(element);
    },

    /** @returns {*} the removed front element, or undefined when empty */
    dequeue: function () {
        return this._dataStore.shift();
    },

    /** @returns {*} the front element without removing it */
    front: function () {
        return this._dataStore[0];
    },

    /** @returns {*} the back element without removing it */
    back: function () {
        return this._dataStore[this._dataStore.length - 1];
    },

    /** @returns {boolean} true when the queue holds no elements */
    empty: function () {
        return this._dataStore.length === 0;
    },

    /**
     * Concatenates the elements front-to-back, each followed by a comma
     * (so a non-empty result ends with a trailing comma).
     * @returns {string}
     */
    toString: function () {
        return this._dataStore.map(function (item) {
            return item + ",";
        }).join("");
    }
};

队列比栈稍微复杂一点，总体来说也是比较容易理解的。

案例：舞伴分配

/**
 * A dancer waiting for a partner.
 * @param {string} name dancer's name
 * @param {string} sex "F" or "M", as found in the roster entries
 */
function Dancer(name, sex) {
    this.name = name; // display name
    this.sex = sex;   // decides which queue the dancer joins
}

/**
 * Fills the two queues from a built-in roster. Every roster entry has the form
 * "<sex> <first name> <last name>"; only the first name is kept on the Dancer.
 * @param {object} males queue (needs enqueue) receiving the non-"F" entries
 * @param {object} females queue (needs enqueue) receiving the "F" entries
 */
function getDancers(males, females) {
    var names = ['F Allison McMillan','M Frank Opitz','M Mason McMillan','M Clayton Ruff','F Cheryl Ferenback','M Raymond Williams','F Jennifer Ingram','M Bryan Frazer','M David Durr','M Danny Martin','F Aurora Adney'];

    names.forEach(function (entry) {
        var fields = entry.split(" ");
        var sex = fields[0];
        var target = sex === "F" ? females : males;
        target.enqueue(new Dancer(fields[1], sex));
    });
}

/**
 * Pairs dancers off in arrival order: one dancer is taken from the front of
 * each queue and the pair is logged, until either queue runs out.
 * @param {object} males queue offering empty/dequeue
 * @param {object} females queue offering empty/dequeue
 */
function dance(males, females) {
    console.log("The dance partners are: \n");

    for (;;) {
        if (females.empty() || males.empty()) {
            break; // somebody is left without a partner
        }
        var lady = females.dequeue();
        var gentleman = males.dequeue();
        console.log("Female dancer is: " + lady.name + " and the male dancer is: " + gentleman.name);
    }
}

// Demo: build both queues from the roster, pair the dancers off, then report
// who is next in line in whichever queue still has people waiting.
var maleDancers = new Queue();
var femaleDancers = new Queue();

getDancers(maleDancers, femaleDancers);
dance(maleDancers, femaleDancers);

[femaleDancers, maleDancers].forEach(function (line) {
    if (!line.empty()) {
        console.log(line.front().name + " is waiting to dance.");
    }
});

在一般情况下，从队列中删除元素时总是优先删除最先入队的元素，但有时也需要使用优先队列来模拟另一类场景，比如医院的急诊：给队列中每个元素添加一个优先级别，并改写dequeue方法，让优先级最高的元素先出队。

dequeue:function() {

    var priority = this._dataStore[0].code;//code表示优先级别，数值越小优先级越高

    for (var i = 1; i < this._dataStore.length; ++i) {priority =Math.min(priority,i);}

    return this.dataStore.splice(priority,1);

}

四、链表

定义：链表是由一组节点组成的集合，每个节点都使用一个对象的引用指向下一个节点，这个引用叫做链。

除了对数据的随机访问，链表几乎可以代替一维数组。它与数组的主要区别是：数组的元素靠位置进行引用，链表靠相互指向进行引用。

链表的封装代码：

/**
 * One node of a singly linked list.
 * @param {*} element payload stored in the node
 */
function Node(element) {
    this.element = element; // the stored value
    this.next = null;       // link to the following node; null marks the tail
}

/**
 * Singly linked list. The list always starts with a sentinel node whose
 * element is the string "head"; real data lives in the nodes after it.
 */
function LList() {
    this.head = new Node("head");
}

LList.prototype = {
    constructor: LList,

    /**
     * Finds the first node whose element is strictly equal (===) to `item`,
     * the same matching rule findPrev uses.
     * @param {*} item element to look for ("head" matches the sentinel)
     * @returns {?Node} the matching node, or null when there is none
     */
    find: function (item) {
        var currNode = this.head;
        // Stop at the end of the chain instead of dereferencing null.
        while (currNode !== null && currNode.element !== item) {
            currNode = currNode.next;
        }
        return currNode;
    },

    /**
     * Inserts a new node holding `newElement` right after the node holding `item`.
     * @param {*} newElement value for the new node
     * @param {*} item element of the node to insert after
     * @returns {boolean} true when inserted, false when `item` is not in the list
     */
    insert: function (newElement, item) {
        var current = this.find(item);
        if (current === null) {
            return false;
        }
        var newNode = new Node(newElement);
        newNode.next = current.next; // the new node takes over the old successor first
        current.next = newNode;      // then the anchor is linked to the new node
        return true;
    },

    /** Logs the element of every node after the sentinel, front to back. */
    display: function () {
        for (var node = this.head.next; node !== null; node = node.next) {
            console.log(node.element);
        }
    },

    /**
     * Finds the node that precedes the node holding `item`.
     * @param {*} item element to look for
     * @returns {Node} the predecessor, or the last node when `item` is absent
     */
    findPrev: function (item) {
        var currNode = this.head;
        while (currNode.next !== null && currNode.next.element !== item) {
            currNode = currNode.next;
        }
        return currNode;
    },

    /**
     * Unlinks the first node holding `item`; does nothing when it is absent.
     * @param {*} item element to remove
     * @returns {boolean} true when a node was removed
     */
    remove: function (item) {
        var prevNode = this.findPrev(item);
        if (prevNode.next === null) {
            return false;
        }
        prevNode.next = prevNode.next.next;
        return true;
    }
};

跟之前的三种数据结构不同，链表没有采用数组作为底层数据存储，而是采用对象节点作为基础，同时每个节点中都含有一个next属性指向另一个对象，与优先队列中的优先级别code颇为类似。总体来看，链表是通过每个节点的next属性，将分散的对象连接到了一起。

如上我们只是实现了单向链表，从头遍历到尾很简单，想要反过来遍历就没那么容易了。我们可以通过给节点增加一个prev属性，指向它的前一个节点，也能实现双向链表。当然，双向链表在新增和删除节点时的操作也要复杂一些，需要同时修改前后节点的next或prev属性。

另外，我们还可以让单向链表的尾节点指向首节点，这样就变成了循环链表。这样需要对链表的一些方法进行改造，防止遍历链表时出现无限循环。

五、字典

定义：字典是一种以键值对形式存储的数据结构。

JS中对象就是以字典的形式设计的，但字典的基础是数组，而不是对象。这样可以进行排序，况且JS中一切皆对象，数组也不例外。

字典的封装代码：

/**
 * Dictionary: key/value store whose entries are kept as named properties on
 * an Array instance.
 */
function Dictionary() {
    this._datastore = [];
}

Dictionary.prototype = {
    constructor: Dictionary,

    /**
     * Adds or overwrites the entry for `key`.
     * @param {string|number} key entry key
     * @param {*} value entry value
     * @throws {RangeError} for the key "length": on the backing array that
     *     name is the array's own length, so writing it would resize the store
     *     instead of creating an entry
     */
    add: function (key, value) {
        if (String(key) === "length") {
            throw new RangeError('"length" cannot be used as a dictionary key');
        }
        this._datastore[key] = value;
    },

    /**
     * Looks up the value stored under `key`.
     * @param {string|number} key entry key
     * @returns {*} the stored value, or undefined when no entry exists
     */
    find: function (key) {
        // Only own enumerable properties are entries; this keeps built-in
        // Array members such as "push" or "length" from showing up as values.
        var isEntry = Object.prototype.propertyIsEnumerable.call(this._datastore, key);
        return isEntry ? this._datastore[key] : undefined;
    },

    /** Deletes the entry for `key`; does nothing when it does not exist. */
    remove: function (key) {
        delete this._datastore[key];
    },

    /** Logs every entry as "key -> value" (sort the key array first if order matters). */
    showAll: function () {
        var store = this._datastore;
        Object.keys(store).forEach(function (key) {
            console.log(key + " -> " + store[key]);
        });
    },

    /** @returns {number} the number of entries */
    count: function () {
        // Object.keys sees own entries only, matching what showAll prints.
        return Object.keys(this._datastore).length;
    },

    /** Removes every entry. */
    clear: function () {
        this._datastore = [];
    }
};

字典依然采用数组作为底层数据存储，但是与普通按序号索引的数组不同，它只能以key进行查询。

六、散列

定义：散列是一种常用的数据存储技术，散列后的数据可以快速地插入或取用。散列使用的数据结构叫做散列表。

散列通过一个散列函数（Hash，哈希）将键映射为一个数字，这个数字的范围是 0 到散列表的长度（不含长度本身）。

散列的封装代码：

/**
 * HashTable: fixed-size table in which each value is stored at the slot
 * computed by a hash function. Colliding values overwrite each other.
 */
function HashTable() {
    this._table = new Array(137); // a prime table size spreads the hashes more evenly
}

HashTable.prototype = {
    constructor: HashTable,

    /**
     * Simple hash: sum of the character codes modulo the table size.
     * @param {string} data key to hash
     * @returns {number} slot index in [0, table size)
     */
    simpleHash: function (data) {
        var total = 0;
        for (var i = 0; i < data.length; ++i) {
            total += data.charCodeAt(i);
        }
        return total % this._table.length;
    },

    /**
     * Polynomial hash that collides less often than simpleHash.
     * @param {string} data key to hash
     * @returns {number} slot index in [0, table size)
     */
    betterHash: function (data) {
        const H = 37;
        var size = this._table.length;
        var total = 0;
        for (var i = 0; i < data.length; ++i) {
            // Same recurrence as before (total += H * total + code), but reduced
            // at every step so long keys cannot overflow to Infinity/NaN. The
            // result is identical for every key the unreduced form handled exactly.
            total = (total + H * total + data.charCodeAt(i)) % size;
        }
        return total;
    },

    /**
     * Stores `data` at the slot given by simpleHash(data).
     * put and get must hash with the same function; to use betterHash, switch both.
     * @param {string} data value to store (it is also its own key)
     */
    put: function (data) {
        this._table[this.simpleHash(data)] = data;
    },

    /** Logs every occupied slot as "index: value". */
    showDistro: function () {
        for (var i = 0; i < this._table.length; ++i) {
            if (this._table[i] !== undefined) {
                console.log(i + ": " + this._table[i]);
            }
        }
    },

    /**
     * Reads the slot `key` hashes to, using the same hash function as put.
     * @param {string} key key to look up
     * @returns {*} the stored value, or undefined when the slot is empty
     */
    get: function (key) {
        return this._table[this.simpleHash(key)];
    }
};

散列其实是通过一种机制（散列函数），将数据存储到散列表对应的位置上去，当机制跟内容相关时仅出现修改才会改变。（MD5类似散列函数的机制）

当散列函数对于多个输入产生同样的输出时称为碰撞。常见的解决办法有开链法（用数组存储多个相同输出）和探测法（线性探测下个位置，直到有空值存入）。

案例：数据存储

// Demo: store nine names and print the occupied slots.
var students = ["David", "Jennifer", "Donnie", "Raymond", "Cynthia", "Mike", "Clayton", "Danny", "Jonathan"];

var hTable = new HashTable();
students.forEach(function (student) {
    hTable.put(student);
});

// Nine names end up in eight slots: one collision occurred.
hTable.showDistro();

七、集合

定义：集合是一种包含不同元素的数据结构，这些元素是无序且不重复的。

集合的封装代码：

/**
 * Set: collection of unique values backed by an array. Membership is decided
 * by Array.prototype.indexOf.
 * Note: this declaration shadows the built-in Set inside its scope; the name
 * is kept so existing callers continue to work.
 */
function Set() {
    this._dataStore = [];
}

Set.prototype = {
    constructor: Set,

    /**
     * Adds `data` unless it is already a member.
     * @param {*} data value to add
     * @returns {boolean} true when added, false when it was already present
     */
    add: function (data) {
        if (this.contains(data)) {
            return false;
        }
        this._dataStore.push(data);
        return true;
    },

    /**
     * Removes `data` when it is a member.
     * @param {*} data value to remove
     * @returns {boolean} true when removed, false when it was not present
     */
    remove: function (data) {
        var pos = this._dataStore.indexOf(data);
        if (pos === -1) {
            return false;
        }
        this._dataStore.splice(pos, 1);
        return true;
    },

    /**
     * @param {*} data value to test
     * @returns {boolean} true when `data` is a member
     */
    contains: function (data) {
        return this._dataStore.indexOf(data) > -1;
    },

    /** @returns {number} the number of members */
    size: function () {
        return this._dataStore.length;
    },

    /**
     * @param {Set} set the other set
     * @returns {Set} a new set holding every member of this set and of `set`
     */
    union: function (set) {
        var tempSet = new Set();
        var addMember = function (member) {
            tempSet.add(member); // add() already skips duplicates
        };
        this._dataStore.forEach(addMember);
        set.show().forEach(addMember);
        return tempSet;
    },

    /**
     * @param {Set} set the other set
     * @returns {Set} a new set holding the members present in both sets
     */
    intersect: function (set) {
        var tempSet = new Set();
        this._dataStore.forEach(function (member) {
            if (set.contains(member)) {
                tempSet.add(member);
            }
        });
        return tempSet;
    },

    /**
     * @param {Set} set the candidate superset
     * @returns {boolean} true when every member of this set is also in `set`
     */
    subset: function (set) {
        if (this.size() > set.size()) {
            return false;
        }
        // every() stops at the first missing member and propagates the result,
        // which a `return false` inside a forEach callback cannot do.
        return this._dataStore.every(function (member) {
            return set.contains(member);
        });
    },

    /**
     * @param {Set} set the other set
     * @returns {Set} a new set holding the members of this set that are not in `set`
     */
    difference: function (set) {
        var tempSet = new Set();
        this._dataStore.forEach(function (member) {
            if (!set.contains(member)) {
                tempSet.add(member);
            }
        });
        return tempSet;
    },

    /** @returns {Array} the backing array of members (not a copy) */
    show: function () {
        return this._dataStore;
    }
};

集合的数据结构比较简单，主要实现了添加元素时检查唯一性，以及交集、并集、补集的方法和子集的检查。

八、二叉树和二叉查找树

定义：树由一组以边连接的节点组成，二叉树是子节点不超过两个的特殊树。

二叉树的封装代码：

/**
 * One node of a binary tree.
 * @param {*} data value stored in the node
 * @param {?Node2} left left child
 * @param {?Node2} right right child
 */
function Node2(data, left, right) {
    this.data = data;
    this.left = left;
    this.right = right;

    // Accessor attached to each instance; returns the stored value.
    this.show = function () {
        return this.data;
    };
}

/**
 * Binary search tree: smaller values go into the left subtree, all other
 * values (including duplicates) into the right subtree.
 */
function BST() {
    this.root = null;
}

BST.prototype = {
    constructor: BST,

    /**
     * Inserts `data` as a new leaf.
     * @param {*} data value to insert; must be comparable with `<`
     */
    insert: function (data) {
        var n = new Node2(data, null, null);
        if (this.root == null) {
            this.root = n;
            return;
        }
        var current = this.root;
        while (true) {
            var side = data < current.data ? "left" : "right";
            if (current[side] == null) {
                current[side] = n;
                return;
            }
            current = current[side];
        }
    },

    /**
     * In-order traversal (left, node, right) that logs each value followed by a space.
     * @param {?Node2} node root of the subtree to traverse
     */
    inOrder: function (node) {
        if (node == null) {
            return;
        }
        this.inOrder(node.left);
        console.log(node.show() + " ");
        this.inOrder(node.right);
    },

    /**
     * Returns the left-most node of a subtree, i.e. the one holding its smallest value.
     * @param {Node2} node root of a non-empty subtree
     * @returns {Node2}
     */
    getSmallest: function (node) {
        var current = node;
        while (current.left != null) {
            current = current.left;
        }
        return current;
    },

    /** @returns {*} the smallest value in the tree, or null when the tree is empty */
    getMin: function () {
        if (this.root == null) {
            return null;
        }
        return this.getSmallest(this.root).data;
    },

    /** @returns {*} the largest value in the tree, or null when the tree is empty */
    getMax: function () {
        if (this.root == null) {
            return null;
        }
        var current = this.root;
        while (current.right != null) {
            current = current.right;
        }
        return current.data;
    },

    /**
     * Searches for `data`.
     * @param {*} data value to look for
     * @returns {?Node2} the node holding it, or null when absent
     */
    find: function (data) {
        var current = this.root;
        while (current != null) {
            if (current.data == data) {
                return current;
            }
            current = data < current.data ? current.left : current.right;
        }
        return null;
    },

    /**
     * Removes one node holding `data`; does nothing when it is absent.
     * @param {*} data value to remove
     */
    remove: function (data) {
        // The result must be stored on this.root: removing the root itself
        // (or the last node) changes which node is the root.
        this.root = this.removeNode(this.root, data);
    },

    /**
     * Removes `data` from the subtree rooted at `node`.
     * @param {?Node2} node root of the subtree
     * @param {*} data value to remove
     * @returns {?Node2} the root of the subtree after the removal
     */
    removeNode: function (node, data) {
        if (node == null) {
            return null;
        }
        if (data == node.data) {
            if (node.left == null && node.right == null) { return null; } // leaf
            if (node.left == null) { return node.right; }                 // right child only
            if (node.right == null) { return node.left; }                 // left child only
            // Two children: take over the smallest value of the right subtree,
            // then remove that value from the right subtree.
            var successor = this.getSmallest(node.right);
            node.data = successor.data;
            node.right = this.removeNode(node.right, successor.data);
            return node;
        }
        if (data < node.data) {
            node.left = this.removeNode(node.left, data);
        } else {
            node.right = this.removeNode(node.right, data);
        }
        return node;
    }
};

二叉树有点类似链表的数据结构，采用节点的左右属性来指向两个子节点。

九、图和图算法

定义：图是由边的集合及顶点的集合组成的。常用于地图和航班等信息数据的建模。

图的封装代码：

/**
 * Undirected graph stored as adjacency lists.
 * @param {number} v number of vertices; vertices are numbered 0 .. v-1
 */
function Graph(v) {
    this.vertices = v;
    this.edges = 0;
    this.adj = [];    // adj[i]: neighbours of vertex i, preceded by a "" placeholder at index 0
    this.marked = []; // marked[i]: whether a traversal has visited vertex i
    for (var i = 0; i < this.vertices; ++i) {
        this.adj[i] = [""];
        this.marked[i] = false;
    }
    this.edgeTo = []; // edgeTo[w]: the vertex from which bfs first reached w
}

Graph.prototype = {
    constructor: Graph,

    /**
     * Adds an undirected edge between vertices `v` and `w`.
     * @param {number} v first endpoint
     * @param {number} w second endpoint
     */
    addEdge: function (v, w) {
        this.adj[v].push(w);
        this.adj[w].push(v);
        this.edges++;
    },

    /** Logs one line per vertex listing its neighbours. */
    showGraph: function () {
        var p = '';
        for (var i = 0; i < this.vertices; ++i) {
            p += '顶点' + i + ' ->';
            // Walk the whole list: its length depends on the vertex degree,
            // not on the number of vertices.
            for (var j = 0; j < this.adj[i].length; ++j) {
                p += this.adj[i][j] + ' ';
            }
            p += '\n';
        }
        console.log(p);
    },

    /**
     * Depth-first traversal from `v`: logs each vertex the first time it is
     * reached. Visits are recorded in `marked`, which is never reset here.
     * @param {number} v start vertex
     */
    dfs: function (v) {
        this.marked[v] = true;
        var neighbours = this.adj[v];
        if (neighbours === undefined) {
            return; // not a vertex of this graph
        }
        console.log("深度优先: " + v);
        for (var i = 0; i < neighbours.length; ++i) {
            var w = neighbours[i];
            if (w !== '' && !this.marked[w]) { // skip the placeholder entry
                this.dfs(w);
            }
        }
    },

    /**
     * Breadth-first traversal from `s`: logs each vertex as it is taken off
     * the queue and records in `edgeTo` how each vertex was first reached.
     * Visits are recorded in `marked`, which is never reset here.
     * @param {number} s start vertex
     */
    bfs: function (s) {
        var queue = [s];
        this.marked[s] = true;
        while (queue.length > 0) {
            var v = queue.shift();
            if (v !== '' && v !== undefined) {
                console.log("广度优先: " + v);
            }
            var neighbours = this.adj[v] || [];
            for (var i = 0; i < neighbours.length; ++i) {
                var w = neighbours[i];
                if (w === '' || this.marked[w]) { // placeholder or already visited
                    continue;
                }
                this.marked[w] = true;
                this.edgeTo[w] = v;
                queue.push(w);
            }
        }
    },

    /**
     * Follows `edgeTo` from `v` back to vertex 0. Run bfs(0) first so that
     * `edgeTo` describes the breadth-first tree rooted at vertex 0.
     * @param {number} v vertex to start from
     * @returns {Array|undefined} the vertices from `v` to 0 in that order, or
     *     undefined when `v` was never visited or its edgeTo chain does not
     *     lead to vertex 0
     */
    pathTo: function (v) {
        var source = 0;
        if (!this.marked[v]) {
            return undefined;
        }
        var path = [];
        for (var i = v; i != source; i = this.edgeTo[i]) {
            if (i === undefined) {
                return undefined; // chain ended before reaching the source
            }
            path.push(i);
        }
        path.push(source);
        return path;
    }
};

在对图数据模型进行搜索时，有深度优先和广度优先两种。当进行最短路径查找时，就是广度优先搜索的过程。

码农公寓

相关文章