gulp源码解析之任务管理-CSDN博客

提到前端工程的自动化构建，gulp是其中很重要的一个工具，gulp是一种基于stream的前端构建工具，相比于grunt使用临时文件的策略，会有较大的速度优势。本文会对gulp的主要部分进行详细剖析，期待本文能够帮助读者更好地在工程中实践gulp。

gulp等前端构建脚本并不是一种全新的思想，早在几十年前，gnu make已经在各种流行语言中风靡，并解决了相关的各种问题，可以简单的认为gulp是JavaScript语言的“make”。

Gulp 核心模块

gulp有两大核心模块：任务管理和文件处理。

本文通过对Orchestrator任务管理模块的源码进行分析，理清gulp是如何进行任务管理的。

通过查看gulp源码（3.x及之前的版本），可以看到，gulp所有任务管理相关的功能都是直接从Orchestrator模块继承的，而且可以发现gulp官网对相关任务管理接口的描述，和Orchestrator模块的描述几乎完全一样。

// gulp/index.js
...
var Orchestrator = require('orchestrator');
...

/**
 * Gulp constructor. All instance state comes from the Orchestrator
 * constructor, which is invoked with the new Gulp instance as `this`.
 */
function Gulp() {
  Orchestrator.apply(this);
}

util.inherits(Gulp, Orchestrator);  // 从Orchestrator继承而来

Gulp.prototype.task = Gulp.prototype.add;  // task方法直接使用Orchestrator中的add
...

所以下面就一起来分析一下Orchestrator模块。

Orchestrator 模块

Orchestrator github主页中对自身的描述

A module for sequencing and executing tasks and dependencies in maximum concurrency.

简单翻译就是

一个能够以最大并发性对任务及其依赖任务进行排序执行的模块。

Orchestrator模块主要负责任务的添加、管理和执行，并对任务的执行提供异步支持，其核心接口分别是：

add - 添加任务

add用于添加任务，传入任务task的名字，依赖数组，以及任务回调函数。
orchestrator中使用核心属性tasks对象保存各个任务
start - 执行任务

start用于执行之前定义的任务，如果传入多个任务，start会进行合并，依次放入到任务数组，然后对任务数组序列按照依赖关系进行去重排序，最终对排序的任务数组依次执行

下面是具有完整注释的源码。

// Orchestrator/index.js

/*jshint node:true */

"use strict";

var util = require('util');
var events = require('events');
var EventEmitter = events.EventEmitter;
var runTask = require('./lib/runTask');

/*
 * Orchestrator constructor.
 *
 * Runs the EventEmitter constructor against the new instance so that it
 * carries the emitter's per-instance state, then initializes the core fields:
 *
 *   doneCallback - invoked when the whole run is over
 *   seq          - task names in the order they will be run (produced by the
 *                  `sequence` method, i.e. the sequencify module)
 *   tasks        - every registered task, keyed by name; populated by add()
 *   isRunning    - whether a run is currently in progress
 */
function Orchestrator() {
    EventEmitter.call(this);
    this.doneCallback = undefined; // called once every queued task has finished
    this.seq = [];                 // execution order of task names
    this.tasks = {};               // name -> { name, dep: [dependency names], fn }
    this.isRunning = false;        // toggled by .start() / .stop()
}

/*
 * Orchestrator instances inherit the EventEmitter prototype methods.
 */
util.inherits(Orchestrator, EventEmitter);

/*
 * Return the orchestrator to its freshly-constructed state.
 *
 * If a run is in progress it is stopped first via stop(null); with no error
 * and no success flag that call takes stop()'s "aborted" path. Afterwards all
 * registered tasks, the queue, the running flag and the done callback are
 * cleared.
 *
 * @returns {Orchestrator} this, for chaining
 */
Orchestrator.prototype.reset = function () {
    var self = this;

    if (self.isRunning) {
        self.stop(null);
    }

    self.tasks = {};
    self.seq = [];
    self.isRunning = false;
    self.doneCallback = undefined;

    return self;
};

/*
 * Register (or replace) a task.
 *
 * Accepts add(name), add(name, fn), add(name, dep) and add(name, dep, fn).
 * Missing dependencies default to an empty array and a missing function
 * defaults to a no-op. After validating the arguments the task is stored in
 * `this.tasks` under its name as { fn, dep, name }.
 *
 * @param {string} name - task name (required, non-empty)
 * @param {string[]|Function} [dep] - dependency names, or the task function
 *        when the dependency list is omitted
 * @param {Function} [fn] - the task body
 * @returns {Orchestrator} this, for chaining
 * @throws {Error} when name is missing or not a string, fn is not a function,
 *         dep is not an array, or dep contains a non-string entry
 */
Orchestrator.prototype.add = function (name, dep, fn) {
    // add(name, fn): the second argument is really the task function
    var depsOmitted = !fn && typeof dep === 'function';
    var body = depsOmitted ? dep : fn;
    var deps = depsOmitted ? undefined : dep;

    deps = deps || [];
    body = body || function () {}; // no-op

    if (!name) {
        throw new Error('Task requires a name');
    }
    if (typeof name !== 'string') {
        throw new Error('Task requires a name that is a string');
    }
    if (typeof body !== 'function') {
        throw new Error('Task '+name+' requires a function that is a function');
    }
    if (!Array.isArray(deps)) {
        throw new Error('Task '+name+' can\'t support dependencies that is not an array of strings');
    }
    deps.forEach(function (entry) {
        if (typeof entry !== 'string') {
            throw new Error('Task '+name+' dependency '+entry+' is not a string');
        }
    });

    this.tasks[name] = {
        fn: body,
        dep: deps,
        name: name
    };
    return this;
};

/*
 * Combined getter/setter for tasks.
 *
 * With only a name, returns the task object previously stored under that name
 * (undefined when there is none). With a dependency list and/or a function,
 * registers the task through add() and returns nothing (not `this`).
 */
Orchestrator.prototype.task = function (name, dep, fn) {
    if (!dep && !fn) {
        // lookup mode
        return this.tasks[name];
    }
    // definition mode: alias for add, deliberately without a return value
    this.add(name, dep, fn);
};

/*
 * Report whether a task with the given name has been registered.
 *
 * Only own properties of `this.tasks` count. A plain `this.tasks[name]`
 * lookup would also see keys inherited from Object.prototype, so names such
 * as "constructor" or "toString" would wrongly be reported as defined.
 *
 * @param {string} name - task name to look up
 * @returns {boolean} true when a task is stored under that name
 */
Orchestrator.prototype.hasTask = function (name) {
    return Object.prototype.hasOwnProperty.call(this.tasks, name) && !!this.tasks[name];
};

/*
 * Start running tasks.
 *
 * Arguments are task names (strings) and/or arrays of task names. If the last
 * argument is a function it is stored as the done callback instead of being
 * treated as a task. Anything else throws.
 *
 * Steps:
 *   1. collect the requested names in argument order;
 *   2. if a run is already in progress, reset only the requested tasks (and
 *      their dependencies) and put the new names in front of the existing
 *      queue; otherwise reset every task;
 *   3. if no names were given, use every registered task;
 *   4. let `sequence` order the names by dependency (de-duplicated);
 *   5. emit 'start' and kick off execution with _runStep().
 *
 * When sequencing fails, 'task_not_found' and/or 'task_recursion' is emitted
 * according to the error's `missingTask` / `recursiveTasks` fields and the
 * run is ended through stop(err).
 *
 * @returns {Orchestrator} this, for chaining
 * @throws {Error} when an argument is neither a string nor an array
 */
Orchestrator.prototype.start = function() {
    var requested = Array.prototype.slice.call(arguments, 0);
    var names = [];
    var ordered = [];
    var idx, entry, key;

    if (requested.length) {
        // a trailing function is the completion callback, not a task
        if (typeof requested[requested.length - 1] === 'function') {
            this.doneCallback = requested.pop();
        }
        for (idx = 0; idx < requested.length; idx++) {
            entry = requested[idx];
            if (typeof entry === 'string') {
                names.push(entry);
            } else if (Array.isArray(entry)) {
                names = names.concat(entry); // FRAGILE: ASSUME: it's an array of strings
            } else {
                throw new Error('pass strings or arrays of strings');
            }
        }
    }

    if (this.isRunning) {
        // start() called again mid-run: mark the requested tasks (and their
        // dependencies) as not run, then queue them ahead of what is pending
        this._resetSpecificTasks(names);
        names = names.concat(this.seq);
    } else {
        // fresh run: mark every task as not run
        this._resetAllTasks();
    }

    if (names.length < 1) {
        // nothing requested: run all registered tasks
        for (key in this.tasks) {
            if (this.tasks.hasOwnProperty(key)) {
                names.push(this.tasks[key].name);
            }
        }
    }

    try {
        this.sequence(this.tasks, names, ordered, []);
    } catch (err) {
        // The sequencer flags its two known failures on the error object:
        // an undefined task, or a circular dependency chain.
        if (err && err.missingTask) {
            this.emit('task_not_found', {message: err.message, task:err.missingTask, err: err});
        }
        if (err && err.recursiveTasks) {
            this.emit('task_recursion', {message: err.message, recursiveTasks:err.recursiveTasks, err: err});
        }
        this.stop(err);
        return this;
    }

    this.seq = ordered;
    this.emit('start', {message:'seq: '+this.seq.join(',')});
    if (!this.isRunning) {
        this.isRunning = true;
    }
    this._runStep();
    return this;
};


/*
 * End the current run and report how it ended.
 *
 *   - err given          -> emits 'err' ("orchestration failed")
 *   - successfulFinish   -> emits 'stop' ("orchestration succeeded")
 *   - neither            -> treated as an abort: the error becomes the string
 *                           'orchestration aborted' and 'err' is emitted
 *
 * The done callback, when set, then receives the resulting error value. With
 * no done callback and nobody listening for 'err', the error is thrown.
 *
 * @param {*} [err] - failure that ended the run
 * @param {boolean} [successfulFinish] - true when all tasks completed
 */
Orchestrator.prototype.stop = function (err, successfulFinish) {
    var outcome = err;

    this.isRunning = false;

    if (outcome) {
        this.emit('err', {message:'orchestration failed', err:outcome});
    } else if (successfulFinish) {
        this.emit('stop', {message:'orchestration succeeded'});
    } else {
        // ASSUME: no error and no success flag means the run was aborted
        outcome = 'orchestration aborted';
        this.emit('err', {message:'orchestration aborted', err: outcome});
    }

    if (this.doneCallback) {
        this.doneCallback(outcome);
        return;
    }
    if (outcome && !this.listeners('err').length) {
        // No one is listening for the error so speak louder
        throw outcome;
    }
};

/*
 * Dependency-ordering routine: the function exported by the `sequencify`
 * module is attached as the `sequence` method. start() calls it as
 * sequence(tasks, names, results, nest) to fill `results` with the ordered
 * task names.
 */
Orchestrator.prototype.sequence = require('sequencify');

/*
 * Check whether every task in the current queue (`this.seq`) is marked done.
 * An empty queue counts as done.
 *
 * @returns {boolean} false as soon as one queued task is not done
 */
Orchestrator.prototype.allDone = function () {
    var pos;
    for (pos = 0; pos < this.seq.length; pos++) {
        if (!this.tasks[this.seq[pos]].done) {
            return false;
        }
    }
    return true; // nothing disputed it
};

/*
 * Clear the per-run state of a single task so it can be run again: a truthy
 * `done` flag is set back to false and the bookkeeping fields recorded during
 * a run are removed. A missing task is ignored.
 *
 * @param {Object} [task] - task object to reset
 */
Orchestrator.prototype._resetTask = function(task) {
    var runFields = ['start', 'stop', 'duration', 'hrDuration', 'args'];
    var n;

    if (!task) {
        return;
    }
    if (task.done) {
        task.done = false;
    }
    for (n = 0; n < runFields.length; n++) {
        delete task[runFields[n]];
    }
};

/*
 * Reset the per-run state of every registered task (own properties of
 * `this.tasks` only) by passing each one to _resetTask().
 */
Orchestrator.prototype._resetAllTasks = function() {
    var registry = this.tasks;
    var key;
    for (key in registry) {
        if (!registry.hasOwnProperty(key)) {
            continue; // skip anything inherited through the prototype chain
        }
        this._resetTask(registry[key]);
    }
};

/*
 * Reset the named tasks and, recursively, every task they depend on.
 *
 * start() calls this before the dependency sequencer has had a chance to
 * reject circular dependencies, so the walk keeps a record of the names it
 * has already handled. Without it a cycle (a -> b -> a) would recurse until
 * the call stack overflows. Each task is therefore reset at most once.
 *
 * @param {string[]} [names] - task names to reset; unknown names are ignored
 * @param {Object} [visited] - internal: names already handled during this
 *        walk (callers normally omit it)
 */
Orchestrator.prototype._resetSpecificTasks = function (names, visited) {
    var i, name, t;

    // prototype-less map so any task name is a safe key
    visited = visited || Object.create(null);

    if (names && names.length) {
        for (i = 0; i < names.length; i++) {
            name = names[i];
            if (visited[name]) {
                continue; // already reset (shared dependency or a cycle)
            }
            visited[name] = true;
            t = this.tasks[name];
            if (t) {
                this._resetTask(t);
                if (t.dep && t.dep.length) {
                    this._resetSpecificTasks(t.dep, visited); // recurse
                }
            }
            // FRAGILE: a name with no registered task is silently ignored
        }
    }
};

/*
 * Make one scheduling pass over the ordered queue (`this.seq`).
 *
 * Every task that is neither done nor running, and that _readyToRunTask()
 * reports as ready, is handed to _runTask(). When the pass completes and
 * allDone() is true, the run is ended with stop(null, true).
 *
 * Does nothing when the orchestrator is not running.
 */
Orchestrator.prototype._runStep = function () {
    var i, task;
    if (!this.isRunning) {
        return; // user aborted, ASSUME: stop called previously
    }
    for (i = 0; i < this.seq.length; i++) {
        task = this.tasks[this.seq[i]];
        if (!task.done && !task.running && this._readyToRunTask(task)) {
            this._runTask(task);
        }
        // Re-check on every iteration: _readyToRunTask() calls stop() for a
        // missing dependency, and _runTask()'s completion handler calls stop()
        // when the task reports an error.
        if (!this.isRunning) {
            return; // task failed or user aborted, ASSUME: stop called previously
        }
    }
    if (this.allDone()) {
        this.stop(null, true);
    }
};

/*
 * Decide whether a task may run now: it is ready only when every one of its
 * dependencies is registered and already done. A dependency that is not
 * registered ends the whole run via stop() with an explanatory message.
 *
 * @param {Object} task - task object with `name` and `dep`
 * @returns {boolean} true when all dependencies are done
 */
Orchestrator.prototype._readyToRunTask = function (task) {
    var k, depName, depTask;

    for (k = 0; k < task.dep.length; k++) {
        depName = task.dep[k];
        depTask = this.tasks[depName];
        if (!depTask) {
            // FRAGILE: this should never happen
            this.stop("can't run "+task.name+" because it depends on "+depName+" which doesn't exist");
            return false;
        }
        if (!depTask.done) {
            return false;
        }
    }
    return true; // no one disproved it
};

/*
 * Record the outcome of a finished task: copy the timing figures from `meta`
 * onto the task, clear its running flag and mark it done.
 *
 * @param {Object} task - the task that just finished
 * @param {Object} meta - run metadata providing `duration` and `hrDuration`
 */
Orchestrator.prototype._stopTask = function (task, meta) {
    var elapsed = meta.duration;
    var elapsedHr = meta.hrDuration;

    task.duration = elapsed;
    task.hrDuration = elapsedHr;
    task.running = false;
    task.done = true;
};

/*
 * Announce that a task has finished. The task's event payload (`task.args`,
 * created here if absent) is updated with the task's timing and a message of
 * the form "<task name> <message>", then emitted as 'task_stop', or as
 * 'task_err' with the error attached when `err` is truthy.
 *
 * @param {Object} task - the finished task
 * @param {string} message - text appended after the task name
 * @param {*} [err] - error reported by the task, if any
 */
Orchestrator.prototype._emitTaskDone = function (task, message, err) {
    var payload, eventName;

    if (!task.args) {
        task.args = {task:task.name};
    }
    payload = task.args;
    payload.duration = task.duration;
    payload.hrDuration = task.hrDuration;
    payload.message = task.name+' '+message;

    eventName = 'task_stop';
    if (err) {
        payload.err = err;
        eventName = 'task_err';
    }
    this.emit(eventName, payload);
};

/*
 * Start a single task.
 *
 * Creates the task's event payload, emits 'task_start', marks the task as
 * running and hands the task function (bound to this orchestrator) to
 * runTask() together with a completion handler. The handler receives
 * (err, meta); it records the result on the task, emits the task's
 * completion event and then either stops the whole run (on error) or
 * triggers the next scheduling pass.
 *
 * NOTE(review): how runTask detects completion (callback argument, returned
 * promise, returned stream, or plain synchronous return) lives in
 * ./lib/runTask and is not visible here; confirm against that module.
 *
 * @param {Object} task - task object with `name` and `fn`
 */
Orchestrator.prototype._runTask = function (task) {
    var self = this;

    var onFinished = function (err, meta) {
        self._stopTask(task, meta);
        self._emitTaskDone(task, meta.runMethod, err);
        if (err) {
            return self.stop(err);
        }
        self._runStep();
    };

    task.args = {task:task.name, message:task.name+' started'};
    self.emit('task_start', task.args);
    task.running = true;

    runTask(task.fn.bind(self), onFinished);
};

// FRAGILE: ASSUME: this list is an exhaustive list of events emitted
// Kept under its own name: the module-level `events` variable already holds
// the required `events` module and must not be overwritten by this list.
var allEventNames = ['start','stop','err','task_start','task_stop','task_err','task_not_found','task_recursion'];

/*
 * Subscribe `callback` to one event on `target`. Before the callback runs,
 * the event payload is tagged with the event name in its `src` field.
 * NOTE(review): assumes every emit passes an object payload - confirm for
 * any new event added to the list above.
 */
var listenToEvent = function (target, event, callback) {
    target.on(event, function (e) {
        e.src = event;
        callback(e);
    });
};

/*
 * Subscribe a single callback to every event in the list above. The callback
 * receives the event payload, with `src` set to the name of the event that
 * fired.
 *
 * @param {Function} callback - listener for all events
 * @throws {Error} when callback is not a function
 */
Orchestrator.prototype.onAll = function (callback) {
    var i;
    if (typeof callback !== 'function') {
        throw new Error('No callback specified');
    }

    for (i = 0; i < allEventNames.length; i++) {
        listenToEvent(this, allEventNames[i], callback);
    }
};

module.exports = Orchestrator;

sequencify

sequencify模块主要完成的工作就是针对一个给定的任务数组序列，分析依赖关系，最终给出一个按照任务依赖顺序排列的任务数组序列，供Orchestrator随后依次执行各个任务。

// sequencify/index.js
/*jshint node:true */

"use strict";

/*
 * Order tasks so that every task appears after all of its dependencies.
 *
 * @param {Object} tasks - all defined tasks, keyed by name; each task has a
 *        `name` and a `dep` array of dependency names
 * @param {string[]} names - the task names to order
 * @param {string[]} results - output: receives the ordered, de-duplicated
 *        task names (appended in place)
 * @param {string[]} [nest] - the dependency path currently being walked. With
 *        taskA -> taskB -> taskC it is ['taskA'] while taskB is analysed and
 *        ['taskA', 'taskB'] while taskC is analysed. Meeting a task that is
 *        already on this path means the dependencies are circular.
 * @throws {Error} with `missingTask` and `taskList` set when a name has no
 *         task defined; with `recursiveTasks` and `taskList` set when a
 *         circular dependency is found
 *
 * Only own properties of `tasks` count as defined tasks, so a name such as
 * "constructor" or "toString" is reported as a missing task instead of
 * resolving to a value inherited from Object.prototype.
 */
var sequence = function (tasks, names, results, nest) {
    var hasOwn = Object.prototype.hasOwnProperty;
    var i, name, node, e;

    // Names of all defined tasks, attached to errors for diagnostics.
    var listTaskNames = function () {
        var list = [], key;
        for (key in tasks) {
            if (hasOwn.call(tasks, key)) {
                list.push(tasks[key].name);
            }
        }
        return list;
    };

    nest = nest || [];
    for (i = 0; i < names.length; i++) {
        name = names[i];
        // de-dup results
        if (results.indexOf(name) !== -1) {
            continue;
        }
        node = hasOwn.call(tasks, name) ? tasks[name] : undefined;
        if (!node) {
            e = new Error('task "'+name+'" is not defined');
            e.missingTask = name;
            e.taskList = listTaskNames();
            throw e;
        }
        if (nest.indexOf(name) > -1) {
            // the task is already on the current path: circular dependency
            nest.push(name);
            e = new Error('Recursive dependencies detected: '+nest.join(' -> '));
            e.recursiveTasks = nest;
            e.taskList = listTaskNames();
            throw e;
        }
        if (node.dep && node.dep.length) {
            nest.push(name);
            sequence(tasks, node.dep, results, nest); // recurse
            nest.pop();
        }
        results.push(name);
    }
};

module.exports = sequence;