kiwix · Jaifroid · Sep 7, 2019 · Aug 22, 2019 · Aug 22, 2019 · Aug 23, 2019
diff --git a/service-worker.js b/service-worker.js
@@ -23,117 +23,240 @@
  */
 'use strict';
 
-self.addEventListener('install', function(event) {
+/**
+ * The name of the Cache API cache in which assets defined in regexpCachedContentTypes will be stored
+ * The value is defined in app.js and will be passed to Service Worker on initialization (to avoid duplication)
+ * @type {String}
+ */
+var CACHE;
+
+/**
+ * A global Boolean that governs whether CACHE will be used
+ * Caching is on by default but can be turned off by the user in Configuration
+ * @type {Boolean}
+ */
+var useCache = true;
+
+/**  
+ * A regular expression that matches the Content-Types of assets that may be stored in CACHE
+ * Add any further Content-Types you wish to cache to the regexp, separated by '|'
+ * @type {RegExp}
+ */
+var regexpCachedContentTypes = /text\/css|text\/javascript|application\/javascript/i;
+
+/**
+ * A regular expression that excludes listed schemata from caching attempts
+ * As of 08-2019 the chrome-extension: schema is incompatible with the Cache API
+ * 'example-extension' is included to show how to add another schema if necessary
+ * @type {RegExp}
+ */
+var regexpExcludedURLSchema = /^(?:chrome-extension|example-extension):/i;
+
+/** 
+ * Pattern for ZIM file namespace: see https://wiki.openzim.org/wiki/ZIM_file_format#Namespaces
+ * In our case, there is also the ZIM file name used as a prefix in the URL
+ * @type {RegExp}
+ */
+var regexpZIMUrlWithNamespace = /(?:^|\/)([^\/]+\/)([-ABIJMUVWX])\/(.+)/;
+
+self.addEventListener('install', function (event) {
     event.waitUntil(self.skipWaiting());
 });
 
-self.addEventListener('activate', function(event) {
+self.addEventListener('activate', function (event) {
     // "Claiming" the ServiceWorker is necessary to make it work right away,
     // without the need to reload the page.
     // See https://developer.mozilla.org/en-US/docs/Web/API/Clients/claim
     event.waitUntil(self.clients.claim());
 });
 
-var regexpRemoveUrlParameters = new RegExp(/([^?#]+)[?#].*$/);
+var outgoingMessagePort = null;
+var fetchCaptureEnabled = false;
 
-// This function is duplicated from uiUtil.js
-// because using requirejs would force to add the 'fetch' event listener
-// after the initial evaluation of this script, which is not supported any more
-// in recent versions of the browsers.
-// Cf https://bugzilla.mozilla.org/show_bug.cgi?id=1181127
-// TODO : find a way to avoid this duplication
+self.addEventListener('fetch', function (event) {
+    if (fetchCaptureEnabled &&
+        regexpZIMUrlWithNamespace.test(event.request.url) &&
+        event.request.method === "GET") {
 
-/**
- * Removes parameters and anchors from a URL
- * @param {type} url
- * @returns {String} same URL without its parameters and anchors
- */
-function removeUrlParameters(url) {
-    return url.replace(regexpRemoveUrlParameters, "$1");
-}
+        // The ServiceWorker will handle this request either from CACHE or from app.js
 
-var outgoingMessagePort = null;
-var fetchCaptureEnabled = false;
-self.addEventListener('fetch', fetchEventListener);
+        event.respondWith(
+            // First see if the content is in the cache
+            fromCache(event.request).then(
+                function (response) {
+                    // The response was found in the cache so we respond with it 
+                    return response;
+                },
+                function () {
+                    // The response was not found in the cache so we look for it in the ZIM
+                    // and add it to the cache if it is an asset type (css or js)
+                    return fetchRequestFromZIM(event).then(function (response) {
+                        // Add css or js assets to CACHE (or update their cache entries) unless the URL schema is not supported
+                        if (regexpCachedContentTypes.test(response.headers.get('Content-Type')) &&
+                            !regexpExcludedURLSchema.test(event.request.url)) {
+                            event.waitUntil(updateCache(event.request, response.clone()));
+                        }
+                        return response;
+                    }).catch(function (msgPortData, title) {
+                        console.error('Invalid message received from app.js for ' + title, msgPortData);
+                        return msgPortData;
+                    });
+                }
+            )
+        );
+    }
+    // If event.respondWith() isn't called because this wasn't a request that we want to handle,
+    // then the default request/response behavior will automatically be used.
+});
 
 self.addEventListener('message', function (event) {
-    if (event.data.action === 'init') {
-        // On 'init' message, we initialize the outgoingMessagePort and enable the fetchEventListener
-        outgoingMessagePort = event.ports[0];
-        fetchCaptureEnabled = true;
+    if (event.data.action) {
+        if (event.data.action === 'init') {
+            // On 'init' message, we initialize the outgoingMessagePort and enable the fetchEventListener
+            outgoingMessagePort = event.ports[0];
+            fetchCaptureEnabled = true;
+        } else if (event.data.action === 'disable') {
+            // On 'disable' message, we delete the outgoingMessagePort and disable the fetchEventListener
+            outgoingMessagePort = null;
+            fetchCaptureEnabled = false;
+        }
+    }
+    if (event.data.useCache) {
+        // Turns caching on or off (a string value of 'on' turns it on, any other string turns it off)
+        useCache = event.data.useCache === 'on';
+        if (useCache) CACHE = event.data.cacheName;
+        console.log('[SW] Caching was turned ' + event.data.useCache);
     }
-    if (event.data.action === 'disable') {
-        // On 'disable' message, we delete the outgoingMessagePort and disable the fetchEventListener
-        outgoingMessagePort = null;
-        fetchCaptureEnabled = false;
+    if (event.data.checkCache) {
+        // Checks and returns the caching strategy: checkCache key should contain a sample URL string to test
+        testCacheAndCountAssets(event.data.checkCache).then(function (cacheArr) {
+            event.ports[0].postMessage({ 'type': cacheArr[0], 'description': cacheArr[1], 'count': cacheArr[2] });
+        });
     }
 });
 
-// Pattern for ZIM file namespace - see https://wiki.openzim.org/wiki/ZIM_file_format#Namespaces
-// In our case, there is also the ZIM file name, used as a prefix in the URL
-var regexpZIMUrlWithNamespace = /(?:^|\/)([^\/]+\/)([-ABIJMUVWX])\/(.+)/;
+/**
+ * Handles fetch events that need to be extracted from the ZIM
+ * 
+ * @param {Event} fetchEvent The fetch event to be processed
+ * @returns {Promise} A Promise for the Response or the rejected invalid message port data
+ */
+function fetchRequestFromZIM(fetchEvent) {
+    return new Promise(function (resolve, reject) {
+        var nameSpace;
+        var title;
+        var titleWithNameSpace;
+        var regexpResult = regexpZIMUrlWithNamespace.exec(fetchEvent.request.url);
+        var prefix = regexpResult[1];
+        nameSpace = regexpResult[2];
+        title = regexpResult[3];
 
-function fetchEventListener(event) {
-    if (fetchCaptureEnabled) {
-        if (regexpZIMUrlWithNamespace.test(event.request.url)) {
-            // The ServiceWorker will handle this request
-            // Let's ask app.js for that content
-            event.respondWith(new Promise(function(resolve, reject) {
-                var nameSpace;
-                var title;
-                var titleWithNameSpace;
-                var regexpResult = regexpZIMUrlWithNamespace.exec(event.request.url);
-                var prefix = regexpResult[1];
-                nameSpace = regexpResult[2];
-                title = regexpResult[3];
-
-                // We need to remove the potential parameters in the URL
-                title = removeUrlParameters(decodeURIComponent(title));
-
-                titleWithNameSpace = nameSpace + '/' + title;
-
-                // Let's instanciate a new messageChannel, to allow app.s to give us the content
-                var messageChannel = new MessageChannel();
-                messageChannel.port1.onmessage = function(event) {
-                    if (event.data.action === 'giveContent') {
-                        // Content received from app.js
-                        var contentLength = event.data.content ? event.data.content.byteLength : null;
-                        var contentType = event.data.mimetype;
-                        var headers = new Headers ();
-                        if (contentLength) headers.set('Content-Length', contentLength);
-                        if (contentType) headers.set('Content-Type', contentType);
-                        // Test if the content is a video or audio file
-                        // See kiwix-js #519 and openzim/zimwriterfs #113 for why we test for invalid types like "mp4" or "webm" (without "video/")
-                        // The full list of types produced by zimwriterfs is in https://github.com/openzim/zimwriterfs/blob/master/src/tools.cpp
-                        if (contentLength >= 1 && /^(video|audio)|(^|\/)(mp4|webm|og[gmv]|mpeg)$/i.test(contentType)) {
-                            // In case of a video (at least), Chrome and Edge need these HTTP headers else seeking doesn't work
-                            // (even if we always send all the video content, not the requested range, until the backend supports it)
-                            headers.set('Accept-Ranges', 'bytes');
-                            headers.set('Content-Range', 'bytes 0-' + (contentLength-1) + '/' + contentLength);
-                        }
-                        var responseInit = {
-                            status: 200,
-                            statusText: 'OK',
-                            headers: headers
-                        };
-
-                        var httpResponse = new Response(event.data.content, responseInit);
-
-                        // Let's send the content back from the ServiceWorker
-                        resolve(httpResponse);
-                    }
-                    else if (event.data.action === 'sendRedirect') {
-                        resolve(Response.redirect(prefix + event.data.redirectUrl));
-                    }
-                    else {
-                        console.error('Invalid message received from app.js for ' + titleWithNameSpace, event.data);
-                        reject(event.data);
-                    }
+        // We need to remove the potential parameters in the URL
+        title = removeUrlParameters(decodeURIComponent(title));
+
+        titleWithNameSpace = nameSpace + '/' + title;
+
+        // Let's instantiate a new messageChannel, to allow app.js to give us the content
+        var messageChannel = new MessageChannel();
+        messageChannel.port1.onmessage = function (msgPortEvent) {
+            if (msgPortEvent.data.action === 'giveContent') {
+                // Content received from app.js
+                var contentLength = msgPortEvent.data.content ? msgPortEvent.data.content.byteLength : null;
+                var contentType = msgPortEvent.data.mimetype;
+                var headers = new Headers();
+                if (contentLength) headers.set('Content-Length', contentLength);
+                if (contentType) headers.set('Content-Type', contentType);
+                // Test if the content is a video or audio file
+                // See kiwix-js #519 and openzim/zimwriterfs #113 for why we test for invalid types like "mp4" or "webm" (without "video/")
+                // The full list of types produced by zimwriterfs is in https://github.com/openzim/zimwriterfs/blob/master/src/tools.cpp
+                if (contentLength >= 1 && /^(video|audio)|(^|\/)(mp4|webm|og[gmv]|mpeg)$/i.test(contentType)) {
+                    // In case of a video (at least), Chrome and Edge need these HTTP headers or else seeking doesn't work
+                    // (even if we always send all the video content, not the requested range, until the backend supports it)
+                    headers.set('Accept-Ranges', 'bytes');
+                    headers.set('Content-Range', 'bytes 0-' + (contentLength - 1) + '/' + contentLength);
+                }
+                var responseInit = {
+                    status: 200,
+                    statusText: 'OK',
+                    headers: headers
                 };
-                outgoingMessagePort.postMessage({'action': 'askForContent', 'title': titleWithNameSpace}, [messageChannel.port2]);
-            }));
-        }
-        // If event.respondWith() isn't called because this wasn't a request that we want to handle,
-        // then the default request/response behavior will automatically be used.
-    }
+
+                var httpResponse = new Response(msgPortEvent.data.content, responseInit);
+
+                // Let's send the content back from the ServiceWorker
+                resolve(httpResponse);
+            } else if (msgPortEvent.data.action === 'sendRedirect') {
+                resolve(Response.redirect(prefix + msgPortEvent.data.redirectUrl));
+            } else {
+                reject(msgPortEvent.data, titleWithNameSpace);
+            }
+        };
+        outgoingMessagePort.postMessage({
+            'action': 'askForContent',
+            'title': titleWithNameSpace
+        }, [messageChannel.port2]);
+    });
+}
+
+/**
+ * Removes parameters and anchors from a URL
+ * @param {type} url The URL to be processed
+ * @returns {String} The same URL without its parameters and anchors
+ */
+function removeUrlParameters(url) {
+    return url.replace(/([^?#]+)[?#].*$/, '$1');
+}
+
+/**
+ * Looks up a Request in CACHE and returns a Promise for the matched Response
+ * @param {Request} request The Request to fulfill from CACHE
+ * @returns {Response} The cached Response (as a Promise) 
+ */
+function fromCache(request) {
+    // Prevents use of Cache API if user has disabled it
+    if (!useCache) return Promise.reject('disabled');
+    return caches.open(CACHE).then(function (cache) {
+        return cache.match(request).then(function (matching) {
+            if (!matching || matching.status === 404) {
+                return Promise.reject("no-match");
+            }
+            console.log('[SW] Supplying ' + request.url + ' from CACHE...');
+            return matching;
+        });
+    });
 }
+
+/**
+ * Stores or updates in CACHE the given Request/Response pair
+ * @param {Request} request The original Request object
+ * @param {Response} response The Response received from the server/ZIM
+ * @returns {Promise} A Promise for the update action
+ */
+function updateCache(request, response) {
+    // Prevents use of Cache API if user has disabled it
+    if (!useCache) return Promise.resolve();
+    return caches.open(CACHE).then(function (cache) {
+        console.log('[SW] Adding ' + request.url + ' to CACHE');
+        return cache.put(request, response);
+    });
+}
+
+/**
+ * Tests the caching strategy available to this app and if it is Cache API, count the
+ * number of assets in CACHE
+ * @param {String} url A URL to test against excludedURLSchema
+ * @returns {Promise} A Promise that resolves with an array of format [cacheType, cacheDescription, assetCount]
+ */
+function testCacheAndCountAssets(url) {
+    if (regexpExcludedURLSchema.test(url)) return Promise.resolve(['custom', 'Custom', '-']);
+    if (!useCache) return Promise.resolve(['none', 'None', 0]);
+    return caches.open(CACHE).then(function (cache) {
+        return cache.keys().then(function (keys) {
+            return ['cacheAPI', 'Cache API', keys.length];
+        }).catch(function(err) {
+            return err;
+        });
+    }).catch(function(err) {
+        return err;
+    });
+}
diff --git a/www/index.html b/www/index.html
@@ -47,8 +47,8 @@
         <!-- Status indicators -->
         <div id="searchingArticles" style="display: none;" class="status">
             <div class="loader"></div>
-            <div id="cachingCSS" style="display: none;" class="message">
-                Caching styles...
+            <div id="cachingAssets" style="display: none;" class="message">
+                Caching assets...
             </div>
         </div>
         <section id="search-article" role="region">
@@ -233,6 +233,50 @@ <h3>Display settings</h3>
                         </div>
                     </div>
                     <br />
+                    <div class="container">
+                        <h3>Performance settings</h3>
+                        <div class="card card-warning" id="cacheSettingsDiv">
+                            <div class="card-header">Speed up archive access</div>
+                            <div class="card-body">
+                                <div class="row">
+                                    <div class="col-sm-6">
+                                        <div class="radio">
+                                            <p>Kiwix JS can speed up the display of articles by caching assets:</p>
+                                            <label>
+                                                <input type="radio" name="cachedAssetsMode" value="true"
+                                                    id="cachedAssetsModeRadioTrue" checked>
+                                                <strong>Cache assets</strong> (recommended)
+                                            </label>
+                                        </div>
+                                        <div class="radio">
+                                            <label>
+                                                <input type="radio" name="cachedAssetsMode" value="false"
+                                                    id="cachedAssetsModeRadioFalse">
+                                                <strong>Do not cache assets</strong> (empties caches: for low-memory
+                                                devices)
+                                            </label>
+                                        </div>
+                                    </div>
+                                    <div class="col-sm-6">
+                                        <div id="cacheStatusPanel" class="card card-footer" style="overflow: hidden">
+                                            <div>
+                                                <p><b>Cache status:</b></p>
+                                            </div>
+                                            <div class="row">
+                                                <div class="col-7">
+                                                    <p>Cache used: <b id="cacheUsed"></b></p>
+                                                </div>
+                                                <div class="col-5">
+                                                    <p>Assets: <b id="assetsCount"></b></p>
+                                                </div>
+                                            </div>
+                                        </div>
+                                    </div>
+                                </div>
+                            </div>
+                        </div>
+                    </div>
+                    <br />
                     <div class="container">
                         <h3>Expert settings</h3>
                         <div class="card card-danger" id="contentInjectionModeDiv">