diff.js 列表对比算法源码分析

diff.js列表对比算法源码分析

npm上的代码可以查看（https://www.npmjs.com/package/list-diff2) 源码如下：

 /**

  *

  * @param {Array} oldList   原始列表

  * @param {Array} newList   新列表

  * @param {String} key 键名称

  * @return {Object} {children: [], moves: [] }

  * children 是源列表 根据 新列表返回 移动的新数据，比如 oldList = [{id: 1}, {id: 2}, {id: 3}, {id: 4}, {id: 5}, {id: 6}];

  newList = [{id: 2}, {id: 3}, {id: 1}]; 最后返回的children = [

   {id: 1},

   {id: 2},

   {id: 3},

   null,

   null,

   null

  ]

  moves 是源列表oldList 根据新列表newList 返回的操作，children为null的话，依次删除掉掉，因此返回的是

  moves = [

   {type: 0, index:3},

   {type: 0, index: 3},

   {type: 0, index: 3},

   {type: 0, index: 0},

   {type: 1, index: 2, item: {id: 1}}

  ]

  注意：type = 0 是删除操作， type = 1 是新增操作

 */

 function diff(oldList, newList, key) {

   var oldMap = makeKeyIndexAndFree(oldList, key);

   var newMap = makeKeyIndexAndFree(newList, key);

   var newFree = newMap.free;

   var oldKeyIndex = oldMap.keyIndex;

   var newKeyIndex = newMap.keyIndex;

   var moves = [];

   var children = [];

   var i = 0;

   var freeIndex = 0;

   var item;

   var itemKey;

   while(i < oldList.length) {

     item = oldList[i];

     itemKey = getItemKey(item, key);

     if(itemKey) {

       if(!newKeyIndex.hasOwnProperty(itemKey)) {

         children.push(null);

       } else {

         var newItemIndex = newKeyIndex[itemKey];

         children.push(newList[newItemIndex]);

       }

     } else {

       var freeItem = newFree[freeIndex++];

       children.push(freeItem || null);

     }

     i++;

   }

   // 删除不存在的项

   var simulateList = children.slice(0);

   i = 0;

   while (i < simulateList.length) {

     if (simulateList[i] === null) {

       remove(i);

       // 调用该方法执行删除

       removeSimulate(i);

     } else {

       i++;

     }

   }

   //

   var j = i = 0;

   while (i < newList.length) {

     item = newList[i];

     itemKey = getItemKey(item, key);

     var simulateItem = simulateList[j];

     var simulateItemKey = getItemKey(simulateItem, key);

     if (simulateItem) {

       if (itemKey === simulateItemKey) {

         j++;

       } else {

         // 新的一项，插入

         if (!oldKeyIndex.hasOwnProperty(itemKey)) {

           insert(i, item);

         } else {

           var nextItemKey = getItemKey(simulateList[j + 1], key);

           if (nextItemKey === itemKey) {

             remove(i);

             removeSimulate(j);

             j++;

           } else {

             insert(i, item);

           }

         }

       }

     } else {

       insert(i, item);

     }

     i++;

   }

   function remove(index) {

     var move = {index: index, type: 0};

     moves.push(move);

   }

   function insert(index, item) {

     var move = {index: index, item: item, type: 1};

     moves.push(move);

   }

   function removeSimulate(index) {

     simulateList.splice(index, 1);

   }

   return {

     moves: moves,

     children: children

   }

 }

 /*

  * 列表转化为 keyIndex 对象

  * 比如如下代码：

  var list = [{key: 'id1'}, {key: 'id2'}, {key: 'id3'}, {key: 'id4'}]

  var map = diff.makeKeyIndexAndFree(list, 'key');

  console.log(map);

 // {

   keyIndex: {id1: 0, id2: 1, id3: 2, id4: 3},

   free: []

 }

  * @param {Array} list

  * @param {String|Function} key

 */

 function makeKeyIndexAndFree(list, key) {

   var keyIndex = {};

   var free = [];

   for (var i = 0, len = list.length; i < len; i++) {

     var item = list[i];

     var itemKey = getItemKey(item, key);

     if (itemKey) {

       keyIndex[itemKey] = i;

     } else {

       free.push(item);

     }

   }

   return {

     keyIndex: keyIndex,

     free: free

   }

 }

 function getItemKey(item, key) {

   if (!item || !key) {

     return;

   }

   return typeof key === 'string' ? item[key] : key[item]

 }

 exports.makeKeyIndexAndFree = makeKeyIndexAndFree;

 exports.diff = diff;

该js的作用是：深度遍历两个列表数据，每层的节点进行对比，记录下每个节点的差异。并返回该对象的差异。
@return {Object} {children: [], moves: [] }
children 是源列表根据新列表返回移动或新增的数据。

比如

oldList = [{id: 1}, {id: 2}, {id: 3}, {id: 4}, {id: 5}, {id: 6}];

newList = [{id: 2}, {id: 3}, {id: 1}];

最后返回的

children = [

  {id: 1},

  {id: 2},

  {id: 3},

  null,

  null,

  null

 ]

moves 是源列表oldList 根据新列表newList 返回的操作，children为null的话，依次删除掉掉，因此返回的是

moves = [

  {type: 0, index:3},

  {type: 0, index: 3},

  {type: 0, index: 3},

  {type: 0, index: 0},

  {type: 1, index: 2, item: {id: 1}}

]

注意：type = 0 是删除操作， type = 1 是新增操作
因为

oldList = [{id: 1}, {id: 2}, {id: 3}, {id: 4}, {id: 5}, {id: 6}]; 
newList = [{id: 2}, {id: 3}, {id: 1}];

所以oldList根据newList来对比，{id: 4} 和 {id: 5} 和 {id: 6} 在新节点 newList没有找到，因此在moves设置为 {type:0, index:3},
所以oldList数据依次变为 [{id: 1}, {id: 2}, {id: 3}, {id: 5}, {id: 6}] 和 [{id: 1}, {id: 2}, {id: 3}, {id: 6}] 和 [{id: 1}, {id: 2}, {id: 3}]
每次在moves存储了一次的话，原数组会删掉当前的一项，因此oldList 变为 [{id: 1}, {id: 2}, {id: 3}], newList 为 [{id: 2}, {id: 3}, {id: 1}],
然后各自取出该值进行比较，也就是 oldList变为 [1, 2, 3], newList变为 [2, 3, 1]; 因此oldList相对于 newList来讲的话，第一项不相同就删掉该项所以moves新增一项{type: 0, index:0}, index从0开始的，表示第一项被删除，然后第二项1被添加，因此moves再加一项 {type: 1, index:2, item: {id: 1}}；
代码理解如下：

该方法需要传入三个参数 oldLsit, newList, key;
oldList 和 newList 是原始数组和新数组， key是根据键名进行匹配。

现在分别对oldList 和 newList 传值如下数据：
var oldLsit = [{id: 1}, {id: 2}, {id: 3}, {id: 4}, {id: 5}, {id: 6}];
var newList = [{id: 2}, {id: 3}, {id: 1}];

因此 var oldMap = makeKeyIndexAndFree(oldList, key);
makeKeyIndexAndFree代码如下：

function makeKeyIndexAndFree(list, key) {

  var keyIndex = {};

  var free = [];

  for (var i = 0, len = list.length; i < len; i++) {

    var item = list[i];

    var itemKey = getItemKey(item, key);

    if (itemKey) {

      keyIndex[itemKey] = i;

    } else {

      free.push(item);

    }

  }

  return {

    keyIndex: keyIndex,

    free: free

  }

}

getItemKey 代码如下：

function getItemKey(item, key) {

  if (!item || !key) {

    return;

  }

  return typeof key === 'string' ? item[key] : key[item]

}

执行代码变成如下：

var oldMap = {

  keyIndex: {

    1: 0,

    2: 1,

    3: 2,

    4: 3,

    5: 4,

    6: 5

  },

  free: []

}

var newMap = makeKeyIndexAndFree(newList, key); 输出如下：

var newMap = {

  free: [],

  keyIndex: {

    1: 2,

    2: 0,

    3: 1

  }

}

注意：上面的是把{id: xx} 中的xx当做键，但是当xx是数字的话，他会把数字当做索引位置来存储。

var newFree = newMap.free = [];

var oldKeyIndex = oldMap.keyIndex;

var newKeyIndex = newMap.keyIndex;

var moves = [];

var children = [];

var i = 0;

var freeIndex = 0;

var item;

var itemKey;

while(i < oldList.length) {

  item = oldList[i];

  itemKey = getItemKey(item, key);

  if(itemKey) {

    if(!newKeyIndex.hasOwnProperty(itemKey)) {

      children.push(null);

    } else {

      var newItemIndex = newKeyIndex[itemKey];

      children.push(newList[newItemIndex]);

    }

  } else {

    var freeItem = newFree[freeIndex++];

    children.push(freeItem || null);

  }

  i++;

}

while循环旧节点oldList，获取其某一项，比如 {id: 1}, {id: 2}, {id: 3}, {id: 4}, {id: 5}, {id: 6}, 然后根据键名获取某一项的值，分别为：1,2,3,4,5,6。
然后判断新节点中的 newKeyIndex 是否有该属性键名，newKeyIndex = {1: 2, 2: 0, 3: 1}, 判断newKeyIndex 是否有属性 1, 2, 3, 4, 5, 6, 如果没有的话，把null放到children数组里面去，如果有的话，存入children数组里面去，因此children的值变为如下：

children = [

  {id: 1},

  {id: 2},

  {id: 3},

  null,

  null,

  null

];

// 删除不存在的项

var simulateList = children.slice(0);

i = 0;

while (i < simulateList.length) {

  if (simulateList[i] === null) {

    remove(i);

    // 调用该方法执行删除

    removeSimulate(i);

  } else {

    i++;

  }

}

把children数组的值赋值到 simulateList列表中，如果某一项等于null的话，调用 remove(i)方法，把null值以对象的形式保存到moves数组里面去，
同时删除simulateList列表中的null数据。
代码如下：

function remove(index) {

  var move = {index: index, type: 0};

  moves.push(move);

}

function removeSimulate(index) {

  simulateList.splice(index, 1);

}

simulateList 数据变成如下：

simulateList = [

  {id： 1},

  {id:  2},

  {id:  3}

];

因此 moves 变成如下数据：

var moves = [

  {index: 3, type: 0},

  {index: 3, type: 0},

  {index: 3, type: 0}

];

再执行如下代码：

var j = i = 0;

while (i < newList.length) {

  item = newList[i];

  itemKey = getItemKey(item, key);

  var simulateItem = simulateList[j];

  var simulateItemKey = getItemKey(simulateItem, key);

  if (simulateItem) {

    if (itemKey === simulateItemKey) {

      j++;

    } else {

      // 新的一项，插入

      if (!oldKeyIndex.hasOwnProperty(itemKey)) {

        insert(i, item);

      } else {

        var nextItemKey = getItemKey(simulateList[j + 1], key);

        if (nextItemKey === itemKey) {

          remove(i);

          removeSimulate(j);

          j++;

        } else {

          insert(i, item);

        }

      }

    }

  } else {

    insert(i, item);

  }

  i++;

}

遍历新节点数据newList var newList = [{id: 2}, {id: 3}, {id: 1}]; 然后 itemKey = getItemKey(item, key); 那么itemKey=2, 3, 1
var simulateItem = simulateList[j];
simulateList的值如下：

simulateList = [

  {id： 1},

  {id:  2},

  {id:  3}

];

获取simulateList数组中的某一项，然后
var simulateItemKey = getItemKey(simulateItem, key);
因此 simulateItemKey值依次变为1， 2， 3; 先循环最外层的新数据 2， 3，1，然后在循环内层旧数据 1, 2 ,3,
判断 itemKey === simulateItemKey 是否相等，相等的话什么都不做，执行下一次循环，j++; 否则的话，先判断是否在旧节点oldKeyIndex
能否找到新节点的值；oldKeyIndex 数据如下：

{

  1: 0,

  2: 1,

  3: 2,

  4: 3,

  5: 4,

  6: 5

}

如果没有找到该键名的话，说明该新节点数据项就是新增的，那就新增一项，新增的代码如下：

function insert(index, item) {

  var move = {index: index, item: item, type: 1};

  moves.push(move);

}

因此moves代码继续新增一项，type为1就是新增的。否则的话，获取simulateList中的下一个数据值，进行对比，如果能找到的话，执行remove(i)方法，因此moves再新加一项
{type:0, index: i}; 此时 j = 0; 删除原数组的第一项，然后继续循环上面一样的操作。

整个思路重新整理一遍：

var before = [{id: 1}, {id: 2}, {id: 3}, {id: 4}, {id: 5}, {id: 6}];
var after = [{id: 4}, {id: 3}, {id: 2},{id: 1}];
var diffs = diff.diff(before, after, 'id');

上面的代码初始化，原数据 before，新数据 after，key键为id，
oldMap 值为：

oldMap = {

  keyIndex: {

    1: 0,

    2: 1,

    3: 2,

    4: 3,

    5: 4,

    6: 5

  }

}

newMap的值为

newMap = {

  keyIndex: {

    1: 3,

    2: 2,

    3: 1,

    4: 0

  }

}

oldKeyIndex = oldMap.keyIndex = {

  1: 0,

  2: 1,

  3: 2,

  4: 3,

  5: 4,

  6: 5

}

var newKeyIndex = newMap.keyIndex = {

  1: 3,

  2: 2,

  3: 1,

  4: 0

};

遍历 before，获取某一项的值，因此分别为1，2，3，4，5，6；判断newKeyIndex是否有该值，如果没有的话，该它置为null，保存到 children数组里面去；
因此

children = [

  {id: 1},

  {id: 2},

  {id: 3},

  {id: 4},

  null,

  null

]

把children赋值到 simulateList 数组里面去，然后对simulateList数组去掉null值，因此simulateList值变为如下：

simulateList = [

  {id: 1},

  {id: 2},

  {id: 3},

  {id: 4}

]

moves = [

  {

    type: 0,

    index: 4

  },

  {

    type: 0,

    index: 4

  }

]

最后遍历新节点 newList = [{id: 4}, {id: 3}, {id: 2},{id: 1}]; 获取该键值分别为：4, 3, 2, 1;
获取源数组simulateList里面的键值为 1, 2 , 3, 4;

所以 4, 3, 2, 1 遍历和 1, 2, 3, 4 遍历判断是否相等思路如下：
1. 遍历newList键值为 4，先和 1比较，如果相等的话，j++，跳到下一个内部循环，否则的话，先判断该键是否在oldKeyIndex里面，如果不存在的话，说明是新增的，否则的话就进入else语句，判断simulateList下一个值2 是否和 4 相等，不相等的话，直接插入值到数组的第一个位置上去，因此 moves的值变为如下：

moves = [

    {

      type: 0,

      index: 4

    },

    {

      type: 0,

      index: 4

    },

    {

      type: 1,

      index: 0,

      item: {id: 4}

    }

]

2. 同样的道理，把遍历newList的第二项 3，和第一步一样的操作，最后3也是新增的，如下moves的值变为如下：

moves = [

    {

      type: 0,

      index: 4

    },

    {

      type: 0,

      index: 4

    },

    {

      type: 1,

      index: 0,

      item: {id: 4}

    },

    {

      type: 1,

      index: 1,

      item: {id: 3}

    }

]

3. 同样，遍历newList的第三项值为2，和第一步操作，进入else语句，第一个值不符合，接着遍历第二个值，相等，就做删除操作，因此moves变为如下值：

moves = [

    {

      type: 0,

      index: 4

    },

    {

      type: 0,

      index: 4

    },

    {

      type: 1,

      index: 0,

      item: {id: 4}

    },

    {

      type: 1,

      index: 1,

      item: {id: 3}

    },

    {

      type: 0,

      index: 2

    }

]

且 oldList被删除一项，此时j = 0, 所以被删除掉第一项因此 oldList = [2, 3, 4];

4. 同样，遍历 newList的第四项值为 1，和第一步操作一样，值都不相等，因此做插入操作，因此moves值变为

moves = [

    {

      type: 0,

      index: 4

    },

    {

      type: 0,

      index: 4

    },

    {

      type: 1,

      index: 0,

      item: {id: 4}

    },

    {

      type: 1,

      index: 1,

      item: {id: 3}

    },

    {

      type: 0,

      index: 2

    },

    {

      type: 1,

      index: 3,

      item: {id: 1}

    }

]

最后以对象的方式返回 moves 和 children。

diff.js 列表对比算法源码分析的更多相关文章

mahout算法源码分析之Collaborative Filtering with ALS-WR 并行思路
Mahout版本:0.7,hadoop版本:1.0.4,jdk:1.7.0_25 64bit. mahout算法源码分析之Collaborative Filtering with ALS-WR 这个算 ...
mahout算法源码分析之Collaborative Filtering with ALS-WR （四）评价和推荐
Mahout版本:0.7,hadoop版本:1.0.4,jdk:1.7.0_25 64bit. 首先来总结一下 mahout算法源码分析之Collaborative Filtering with AL ...
mahout算法源码分析之Collaborative Filtering with ALS-WR拓展篇
Mahout版本:0.7,hadoop版本:1.0.4,jdk:1.7.0_25 64bit. 额,好吧,心头的一块石头总算是放下了.关于Collaborative Filtering with AL ...
Backbone.js 0.9.2 源码分析收藏
Backbone 为复杂Javascript应用程序提供模型(models).集合(collections).视图(views)的结构.其中模型用于绑定键值数据和自定义事件:集合附有可枚举函数的丰富A ...
Underscore.js 1.3.3 源码分析收藏
Underscore是一个提供许多函数编程功能的库,里面包含了你期待(在Prototype.js和Ruby中)的许多功能.但是没有扩展任何内置的Javascript对象,也就是说它没有扩展任何内置对象 ...
js菜鸟进阶-jQuery源码分析(1)-基本架构
导读: 本人JS菜鸟一枚,为加强代码美观和编程思想.所以来研究下jQuery,有需要进阶JS的同学很适合阅读此文!我是边看代码(jquery2.2.1),边翻“javascript高级程序设计”写的, ...
html5 Sortable.js 拖拽排序源码分析
最近公司项目经常用到一个拖拽 Sortable.js插件,所以有空的时候看了 Sortable.js 源码,总共1300多行这样,写的挺完美的. 本帖属于原创,转载请出名出处. 官网http:// ...
朴素贝叶斯算法源码分析及代码实战【python sklearn/spark ML】
一.简介贝叶斯定理是关于随机事件A和事件B的条件概率的一个定理.通常在事件A发生的前提下事件B发生的概率,与在事件B发生的前提下事件A发生的概率是不一致的.然而,这两者之间有确定的关系,贝叶斯定理就 ...
BeanUtils对象属性copy的性能对比以及源码分析
1. 对象属性拷贝的常见方式及其性能在日常编码中,经常会遇到DO.DTO对象之间的转换,如果对象本身的属性比较少的时候,那么我们采用硬编码手工setter也还ok,但如果对象的属性比较多的情况下,手 ...

随机推荐

centOS(redhat/oracle linux更换语言
编辑/etc/sysconfig/i18n将LANG=”zh_CN.UTF-8″ 改为 LANG=”en_US.UTF-8″ 或其他语言中文乱码将LANG=”zh_CN.UTF-8″改为LANG=”z ...
C++ STL set详解
一.解释 p { margin-bottom: 0.25cm; direction: ltr; color: #000000; line-height: 120%; text-align: justi ...
如何恢复未释放租约的HDFS文件
之前有文章介绍过HDFS租约带来的问题,导致spark应用无法正常读取文件,只能将异常文件找出并且删除后,任务才能继续执行. 但是删除文件实在是下下策,而且文件本身其实并未损坏,只是因为已经close ...
ue4(c++) 按钮中的文字居中的问题
.Content() [ SNew(SOverlay) + SOverlay::Slot().HAlign(HAlign_Center).VAlign(VAlign_Center) [ SNew( ...
在自学java路上遇上的南墙
从2016年12月20号自学java,先是咨询了下培训中心,得小两万,四个月毕业,算了一笔账,一百二十天,合下来每天三百多块,再加上开销之类压力太大,于是开始入坑自学,随后血一般的教训直面而来: 1. ...
Xcode调试时查看变量的方法
在Debug Console窗口中(lldb)后可以使用两个指令: 1.print 变量名:打印出变量值 2.po 对象名:print object,打印出对象中的值: 另外,Command+Shif ...
一个普通的 Zepto 源码分析（二） - ajax 模块
一个普通的 Zepto 源码分析(二) - ajax 模块普通的路人,普通地瞧.分析时使用的是目前最新 1.2.0 版本. Zepto 可以由许多模块组成,默认包含的模块有 zepto 核心模块,以 ...
MySQL执行计划extra中的using index 和 using where using index 的区别
本文出处:http://www.cnblogs.com/wy123/p/7366486.html (保留出处并非什么原创作品权利,本人拙作还远远达不到,仅仅是为了链接到原文,因为后续对可能存在的一些错 ...
ssh相关问题
问题1 一般错误信息为:ssh: connect to host localhost port 22: Connection refused 这种错误很主要的一个原因是sshd服务没有启动,先启动ss ...
Oracle基础--命令
====================== 基础命令====================== 1.su – oracle 不是必需,适合于没有DBA密码时使用,可以不用密码来进入sqlplus界 ...

diff.js 列表对比算法 源码分析

diff.js 列表对比算法 源码分析的更多相关文章

随机推荐

热门专题

diff.js 列表对比算法源码分析

diff.js 列表对比算法源码分析的更多相关文章