zoukankan      html  css  js  c++  java
  • .38-浅析webpack源码之读取babel-loader并转换js文件

      经过非常非常长无聊的流程,只是将获取到的module信息做了一些缓存,然后生成了loaderContext对象。

      这里上个图整理一下这节的流程:

      这一节来看webpack是如何将babel-loader与js文件结合的,首先总览一下runLoaders函数:

    /*
        options => 
        {
            resource: 'd:\workspace\doc\input.js',
            loaders: [ { loader: 'd:\workspace\node_modules\babel-loader\lib\index.js' } ],
            context: loaderContext,
            readResource: fs.readFile.bind(fs)
        }
    */
    exports.runLoaders = function runLoaders(options, callback) {
        // read options
        var resource = options.resource || "";
        var loaders = options.loaders || [];
        var loaderContext = options.context || {};
        var readResource = options.readResource || readFile;
    
        // 简单讲就是获取入口文件的绝对路径、参数、目录
        var splittedResource = resource && splitQuery(resource);
        var resourcePath = splittedResource ? splittedResource[0] : undefined;
        var resourceQuery = splittedResource ? splittedResource[1] : undefined;
        var contextDirectory = resourcePath ? dirname(resourcePath) : null;
    
        // execution state
        var requestCacheable = true;
        var fileDependencies = [];
        var contextDependencies = [];
    
        // prepare loader objects
        loaders = loaders.map(createLoaderObject);
    
        // 将属性都挂载到loaderContext上面
        loaderContext.context = contextDirectory;
        loaderContext.loaderIndex = 0;
        loaderContext.loaders = loaders;
        loaderContext.resourcePath = resourcePath;
        loaderContext.resourceQuery = resourceQuery;
        loaderContext.async = null;
        loaderContext.callback = null;
        loaderContext.cacheable = function cacheable(flag) {
            if (flag === false) {
                requestCacheable = false;
            }
        };
        loaderContext.dependency = loaderContext.addDependency = function addDependency(file) {
            fileDependencies.push(file);
        };
        loaderContext.addContextDependency = function addContextDependency(context) {
            contextDependencies.push(context);
        };
        loaderContext.getDependencies = function getDependencies() {
            return fileDependencies.slice();
        };
        loaderContext.getContextDependencies = function getContextDependencies() {
            return contextDependencies.slice();
        };
        loaderContext.clearDependencies = function clearDependencies() {
            fileDependencies.length = 0;
            contextDependencies.length = 0;
            requestCacheable = true;
        };
        // 定义大量的特殊属性
        Object.defineProperty(loaderContext, "resource", {
            enumerable: true,
            get: function() {
                if (loaderContext.resourcePath === undefined)
                    return undefined;
                return loaderContext.resourcePath + loaderContext.resourceQuery;
            },
            set: function(value) {
                var splittedResource = value && splitQuery(value);
                loaderContext.resourcePath = splittedResource ? splittedResource[0] : undefined;
                loaderContext.resourceQuery = splittedResource ? splittedResource[1] : undefined;
            }
        });
        // ...大量Object.defineProperty
    
        // finish loader context
        if (Object.preventExtensions) {
            Object.preventExtensions(loaderContext);
        }
    
        var processOptions = {
            resourceBuffer: null,
            readResource: readResource
        };
        iteratePitchingLoaders(processOptions, loaderContext, function(err, result) {
            if (err) {
                return callback(err, {
                    cacheable: requestCacheable,
                    fileDependencies: fileDependencies,
                    contextDependencies: contextDependencies
                });
            }
            callback(null, {
                result: result,
                resourceBuffer: processOptions.resourceBuffer,
                cacheable: requestCacheable,
                fileDependencies: fileDependencies,
                contextDependencies: contextDependencies
            });
        });
    };

      传入的4个参数都很直白:

    1、待处理文件绝对路径

    2、文件后缀对应的loader入口文件绝对路径

    3、对应的loaderContext对象

    4、fs对象

      前面所有的事都是为了生成前3个属性,在这里整合在一起开始做转换处理。

    createLoaderObject

      这里有一个需要简单看的地方,就是对loaders数组做了一封封装:

    // prepare loader objects
    loaders = loaders.map(createLoaderObject);

      简单看一下这个函数:

    function createLoaderObject(loader) {
        var obj = {
            path: null,
            query: null,
            options: null,
            ident: null,
            normal: null,
            pitch: null,
            raw: null,
            data: null,
            pitchExecuted: false,
            normalExecuted: false
        };
        // 定义request属性的get/set
        Object.defineProperty(obj, "request", {
            enumerable: true,
            get: function() {
                return obj.path + obj.query;
            },
            set: function(value) {
                if (typeof value === "string") {
                    var splittedRequest = splitQuery(value);
                    obj.path = splittedRequest[0];
                    obj.query = splittedRequest[1];
                    obj.options = undefined;
                    obj.ident = undefined;
                } else {
                    // value => { loader: 'd:\workspace\node_modules\babel-loader\lib\index.js' }
                    if (!value.loader)
                        throw new Error("request should be a string or object with loader and object (" + JSON.stringify(value) + ")");
                    // 这么多行代码其实只有第一行有用
                    // 即obj.path = 'd:\workspace\node_modules\babel-loader\lib\index.js'
                    obj.path = value.loader;
                    obj.options = value.options;
                    obj.ident = value.ident;
                    if (obj.options === null)
                        obj.query = "";
                    else if (obj.options === undefined)
                        obj.query = "";
                    else if (typeof obj.options === "string")
                        obj.query = "?" + obj.options;
                    else if (obj.ident)
                        obj.query = "??" + obj.ident;
                    else if (typeof obj.options === "object" && obj.options.ident)
                        obj.query = "??" + obj.options.ident;
                    else
                        obj.query = "?" + JSON.stringify(obj.options);
                }
            }
        });
        // 这里会触发上面的set
        obj.request = loader;
        // 封装
        if (Object.preventExtensions) {
            Object.preventExtensions(obj);
        }
        return obj;
    }

      最后做封装,然后返回一个obj。

      将属性全部挂载在loaderContext上面,最后也是调用Object.preventExtensions将属性冻结,禁止添加任何新的属性。

      完成对象的安装后,最后调用了迭代器方法,这里看一下iteratePitchingLoaders方法内部实现:

    function iteratePitchingLoaders(options, loaderContext, callback) {
        // abort after last loader
        // loaderIndex初始为0
        if (loaderContext.loaderIndex >= loaderContext.loaders.length)
            return processResource(options, loaderContext, callback);
    
        // 取出之前的obj
        var currentLoaderObject = loaderContext.loaders[loaderContext.loaderIndex];
    
        // iterate
        // 默认是false 代表当前loader未被加载过
        if (currentLoaderObject.pitchExecuted) {
            loaderContext.loaderIndex++;
            return iteratePitchingLoaders(options, loaderContext, callback);
        }
    
        // load loader module
        loadLoader(currentLoaderObject, function(err) {
            // ...
        });
    }

      取出来loader对象后,调用loadLoader来加载loader,看一眼:

    module.exports = function loadLoader(loader, callback) {
        // 不知道这个System是什么环境下的变量
        // node环境是global
        // 浏览器环境是window
        if (typeof System === "object" && typeof System.import === "function") {
            // ...
        } else {
            try {
                // 直接尝试读取路径的文件
                var module = require(loader.path);
            } catch (e) {
                // it is possible for node to choke on a require if the FD descriptor
                // limit has been reached. give it a chance to recover.
                // 因为可能出现阻塞情况 所以这里会进行重试
                if (e instanceof Error && e.code === "EMFILE") {
                    var retry = loadLoader.bind(null, loader, callback);
                    if (typeof setImmediate === "function") {
                        // node >= 0.9.0
                        return setImmediate(retry);
                    } else {
                        // node < 0.9.0
                        return process.nextTick(retry);
                    }
                }
                return callback(e);
            }
            if (typeof loader !== "function" && typeof loader !== "object")
                throw new Error("Module '" + loader.path + "' is not a loader (export function or es6 module))");
            // babel-loader返回的module是一个function
            loader.normal = typeof module === "function" ? module : module.default;
            loader.pitch = module.pitch;
            loader.raw = module.raw;
            if (typeof loader.normal !== "function" && typeof loader.pitch !== "function")
                throw new Error("Module '" + loader.path + "' is not a loader (must have normal or pitch function)");
            callback();
        }
    };

      这里就涉及到loader的返回值,通过直接读取babel-loader的入口文件,最后返回了一个function,后面两个属性babel-loader并没有给,是undefined。

      这里把babel-loader返回值挂载到loader上后,就调用了无参回调函数,如下:

    loadLoader(currentLoaderObject, function(err) {
        if (err) return callback(err);
        // 刚才也说了这个是undefined
        var fn = currentLoaderObject.pitch;
        // 这个表明loader已经被调用了 下次再遇到就会直接跳过
        currentLoaderObject.pitchExecuted = true;
        if (!fn) return iteratePitchingLoaders(options, loaderContext, callback);
    
        runSyncOrAsync(
            fn,
            loaderContext, [loaderContext.remainingRequest, loaderContext.previousRequest, currentLoaderObject.data = {}],
            function(err) {
                if (err) return callback(err);
                var args = Array.prototype.slice.call(arguments, 1);
                if (args.length > 0) {
                    loaderContext.loaderIndex--;
                    iterateNormalLoaders(options, loaderContext, args, callback);
                } else {
                    iteratePitchingLoaders(options, loaderContext, callback);
                }
            }
        );
    });

      这里把loader的一个标记置true,然后根据返回函数是否有pitch值来决定流程,很明显这里直接递归调用自身了。

      第二次进来时,由于loader已经被加载,所以loaderIndex加1,然后再次递归。

      第三次进来时,第一个判断中表明所有的loader都被加载完,会调用processResource方法。

    processResource

      这里的递归由于都是尾递归,所以在性能上不会有问题,直接看上面的方法:

    // options => 包含fs方法的对象
    // loaderContext => 包含loader路径、返回值等的对象
    function processResource(options, loaderContext, callback) {
        // 从后往前调用loader
        loaderContext.loaderIndex = loaderContext.loaders.length - 1;
    
        // 获取入口文件路径
        var resourcePath = loaderContext.resourcePath;
        if (resourcePath) {
            /*
                loaderContext.dependency = loaderContext.addDependency = function addDependency(file) {
                    fileDependencies.push(file);
                };
            */
            loaderContext.addDependency(resourcePath);
            // readResource => fs.readFile
            options.readResource(resourcePath, function(err, buffer) {
                if (err) return callback(err);
                options.resourceBuffer = buffer;
                iterateNormalLoaders(options, loaderContext, [buffer], callback);
            });
        } else {
            iterateNormalLoaders(options, loaderContext, [null], callback);
        }
    }

      这个获取入口文件路径并调用fs模块进行文件内容读取,返回文件的原始buffer后调用了iterateNormalLoaders方法。

    function iterateNormalLoaders(options, loaderContext, args, callback) {
        // 当所有loader执行完后返回
        if (loaderContext.loaderIndex < 0)
            return callback(null, args);
        // 取出当前的loader
        var currentLoaderObject = loaderContext.loaders[loaderContext.loaderIndex];
    
        // iterate
        // 默认为false 跟另外一个标记类似 代表该loader在此方法是否被调用过
        if (currentLoaderObject.normalExecuted) {
            loaderContext.loaderIndex--;
            return iterateNormalLoaders(options, loaderContext, args, callback);
        }
        // 读取返回的module
        var fn = currentLoaderObject.normal;
        // 标记置true
        currentLoaderObject.normalExecuted = true;
        if (!fn) {
            return iterateNormalLoaders(options, loaderContext, args, callback);
        }
        /*
            function convertArgs(args, raw) {
                if (!raw && Buffer.isBuffer(args[0]))
                    args[0] = utf8BufferToString(args[0]);
                else if (raw && typeof args[0] === "string")
                    args[0] = new Buffer(args[0], "utf-8");
            }
            function utf8BufferToString(buf) {
                var str = buf.toString("utf-8");
                if (str.charCodeAt(0) === 0xFEFF) {
                    return str.substr(1);
                } else {
                    return str;
                }
            }
        */
        // 该方法将原始的buffer转换为utf-8的字符串
        convertArgs(args, currentLoaderObject.raw);
    
        runSyncOrAsync(fn, loaderContext, args, function(err) {
            if (err) return callback(err);
    
            var args = Array.prototype.slice.call(arguments, 1);
            iterateNormalLoaders(options, loaderContext, args, callback);
        });
    }

      这里的normal就是处理普通的js文件了,在读取入口文件后将其转换为utf-8的格式,然后依次获取loader,调用runSyncOrAsync。

      源码如下:

    /*
        fn => 读取babel-loader返回的函数
        context => loader的辅助对象
        args => 读取入口文件返回的字符串
    */
    function runSyncOrAsync(fn, context, args, callback) {
        var isSync = true;
        var isDone = false;
        var isError = false; // internal error
        var reportedError = false;
        context.async = function async() {
            if (isDone) {
                if (reportedError) return; // ignore
                throw new Error("async(): The callback was already called.");
            }
            isSync = false;
            return innerCallback;
        };
        // 封装成执行一次的回调函数
        var innerCallback = context.callback = function() {
            if (isDone) {
                if (reportedError) return; // ignore
                throw new Error("callback(): The callback was already called.");
            }
            isDone = true;
            isSync = false;
            try {
                callback.apply(null, arguments);
            } catch (e) {
                isError = true;
                throw e;
            }
        };
        try {
            // 可以可以
            // 老子看了这么久源码就是等这个方法
            // 还装模作样的弄个IIFE
            var result = (function LOADER_EXECUTION() {
                return fn.apply(context, args);
            }());
            if (isSync) {
                isDone = true;
                if (result === undefined)
                    return callback();
                // 根据转换后的类型二次处理
                if (result && typeof result === "object" && typeof result.then === "function") {
                    return result.catch(callback).then(function(r) {
                        callback(null, r);
                    });
                }
                return callback(null, result);
            }
        } catch (e) {
            if (isError) throw e;
            if (isDone) {
                // loader is already "done", so we cannot use the callback function
                // for better debugging we print the error on the console
                if (typeof e === "object" && e.stack) console.error(e.stack);
                else console.error(e);
                return;
            }
            isDone = true;
            reportedError = true;
            callback(e);
        }
    }

      看了那么多的垃圾代码,终于来到了最关键的方法,可以看出,本质上loader就是将读取到的字符串传入,然后返回对应的字符串或者一个Promise。

      这里一路将结果一路返回到了最初的runLoaders方法中:

    iteratePitchingLoaders(processOptions, loaderContext, function(err, result) {
        if (err) {
            return callback(err, {
                cacheable: requestCacheable,
                fileDependencies: fileDependencies,
                contextDependencies: contextDependencies
            });
        }
        /*
            result => babel-loader转换后的字符串
            resourceBuffer => JS文件的原始buffer
            cacheable => [Function]
            fileDependencies => ['d:\workspace\doc\input.js']
            contextDependencies => []
        */
        callback(null, {
            result: result,
            resourceBuffer: processOptions.resourceBuffer,
            cacheable: requestCacheable,
            fileDependencies: fileDependencies,
            contextDependencies: contextDependencies
        });
    });

      因为案例比较简单,所以返回的东西也比较少,这里继续callback,返回到doBuild:

    doBuild(options, compilation, resolver, fs, callback) {
        this.cacheable = false;
        const loaderContext = this.createLoaderContext(resolver, options, compilation, fs);
        runLoaders({
            resource: this.resource,
            loaders: this.loaders,
            context: loaderContext,
            readResource: fs.readFile.bind(fs)
        }, (err, result) => {
            // result => 上面的对象
            if (result) {
                this.cacheable = result.cacheable;
                this.fileDependencies = result.fileDependencies;
                this.contextDependencies = result.contextDependencies;
            }
    
            if (err) {
                const error = new ModuleBuildError(this, err);
                return callback(error);
            }
            // 获取对应的原始buffer、转换后的字符串、sourceMap
            const resourceBuffer = result.resourceBuffer;
            const source = result.result[0];
            // null
            const sourceMap = result.result[1];
    
            if (!Buffer.isBuffer(source) && typeof source !== "string") {
                const error = new ModuleBuildError(this, new Error("Final loader didn't return a Buffer or String"));
                return callback(error);
            }
            /*
                function asString(buf) {
                    if (Buffer.isBuffer(buf)) {
                        return buf.toString("utf-8");
                    }
                    return buf;
                }
            */
            this._source = this.createSource(asString(source), resourceBuffer, sourceMap);
            return callback();
        });
    }

      这次获取处理完的对象属性,然后调用另外一个createSource方法:

    createSource(source, resourceBuffer, sourceMap) {
        // if there is no identifier return raw source
        if (!this.identifier) {
            return new RawSource(source);
        }
    
        // from here on we assume we have an identifier
        // 返回下面这个东西 很久之前拼接的
        // d:workspace
    ode_modulesabel-loaderlibindex.js!d:workspacedocinput.js
        const identifier = this.identifier();
        // 下面两个属性根本没出现过
        if (this.lineToLine && resourceBuffer) {
            return new LineToLineMappedSource(
                source, identifier, asString(resourceBuffer));
        }
    
        if (this.useSourceMap && sourceMap) {
            return new SourceMapSource(source, identifier, sourceMap);
        }
        // 直接进这里
        /*
            class OriginalSource extends Source {
                constructor(value, name) {
                    super();
                    this._value = value;
                    this._name = name;
                }
    
                //...原型方法
            }
        */
        return new OriginalSource(source, identifier);
    }

      因为都比较简单,所以直接看注释就好了,没啥好解释的。

      所有的new都只看看构造函数,方法那么多,又不是全用。

      返回的对象赋值给了NormalModule对象的_source属性,然后又是callback,这次回到了build那里:

    build(options, compilation, resolver, fs, callback) {
        this.buildTimestamp = Date.now();
        this.built = true;
        this._source = null;
        this.error = null;
        this.errors.length = 0;
        this.warnings.length = 0;
        this.meta = {};
    
        return this.doBuild(options, compilation, resolver, fs, (err) => {
            this.dependencies.length = 0;
            this.variables.length = 0;
            this.blocks.length = 0;
            this._cachedSource = null;
    
            // if we have an error mark module as failed and exit
            if (err) {
                this.markModuleAsErrored(err);
                return callback();
            }
    
            // check if this module should !not! be parsed.
            // if so, exit here;
            // undefined跳过
            const noParseRule = options.module && options.module.noParse;
            if (this.shouldPreventParsing(noParseRule, this.request)) {
                return callback();
            }
    
            try {
                this.parser.parse(this._source.source(), {
                    current: this,
                    module: this,
                    compilation: compilation,
                    options: options
                });
            } catch (e) {
                const source = this._source.source();
                const error = new ModuleParseError(this, source, e);
                this.markModuleAsErrored(error);
                return callback();
            }
            return callback();
        });
    }

      基本上不知道module.noParser选项哪个人会用,所以这里一般都是直接跳过然后调用那个可怕对象parser对象的parse方法,开始进行解析。

      这节的内容就这样吧,总算是把loader跑完了,这个系列的目的也就差不多了。

      其实总体来说过程就几步,但是代码的复杂程度真的是不想说了……

  • 相关阅读:
    WPF 绘图 和动画
    BZOJ 4028 分块
    操作系统与计算机网络
    go排序-基数排序
    go排序-睡眠排序
    go排序-堆排序
    go排序-构建大顶堆
    go排序 插入排序
    go排序-选择排序
    go排序-冒泡排序
  • 原文地址:https://www.cnblogs.com/QH-Jimmy/p/8494394.html
Copyright © 2011-2022 走看看