pagestats.js 9.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276
  1. /*******************************************************************************
  2. ηMatrix - a browser extension to black/white list requests.
  3. Copyright (C) 2013-2019 Raymond Hill
  4. Copyright (C) 2019 Alessio Vanni
  5. This program is free software: you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation, either version 3 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program. If not, see {http://www.gnu.org/licenses/}.
  15. Home: https://libregit.org/heckyel/ematrix
  16. uMatrix Home: https://github.com/gorhill/uMatrix
  17. */
  18. 'use strict';
  19. /******************************************************************************/
  20. ηMatrix.pageStoreFactory = (function() {
  21. /******************************************************************************/
  22. var ηm = ηMatrix;
  23. /******************************************************************************/
  24. var BlockedCollapsibles = function() {
  25. this.boundPruneAsyncCallback = this.pruneAsyncCallback.bind(this);
  26. this.blocked = new Map();
  27. this.hash = 0;
  28. this.timer = null;
  29. };
  30. BlockedCollapsibles.prototype = {
  31. shelfLife: 10 * 1000,
  32. add: function(type, url, isSpecific) {
  33. if ( this.blocked.size === 0 ) { this.pruneAsync(); }
  34. var now = Date.now() / 1000 | 0;
  35. // The following "trick" is to encode the specifity into the lsb of the
  36. // time stamp so as to avoid to have to allocate a memory structure to
  37. // store both time stamp and specificity.
  38. if ( isSpecific ) {
  39. now |= 0x00000001;
  40. } else {
  41. now &= 0xFFFFFFFE;
  42. }
  43. this.blocked.set(type + ' ' + url, now);
  44. this.hash = now;
  45. },
  46. reset: function() {
  47. this.blocked.clear();
  48. this.hash = 0;
  49. if ( this.timer !== null ) {
  50. clearTimeout(this.timer);
  51. this.timer = null;
  52. }
  53. },
  54. pruneAsync: function() {
  55. if ( this.timer === null ) {
  56. this.timer = vAPI.setTimeout(
  57. this.boundPruneAsyncCallback,
  58. this.shelfLife * 2
  59. );
  60. }
  61. },
  62. pruneAsyncCallback: function() {
  63. this.timer = null;
  64. var obsolete = Date.now() - this.shelfLife;
  65. for ( var entry of this.blocked ) {
  66. if ( entry[1] <= obsolete ) {
  67. this.blocked.delete(entry[0]);
  68. }
  69. }
  70. if ( this.blocked.size !== 0 ) { this.pruneAsync(); }
  71. }
  72. };
  73. /******************************************************************************/
  74. // Ref: Given a URL, returns a (somewhat) unique 32-bit value
  75. // Based on: FNV32a
  76. // http://www.isthe.com/chongo/tech/comp/fnv/index.html#FNV-reference-source
  77. // The rest is custom, suited for uMatrix.
  78. var PageStore = function(tabContext) {
  79. this.hostnameTypeCells = new Map();
  80. this.domains = new Set();
  81. this.blockedCollapsibles = new BlockedCollapsibles();
  82. this.requestStats = ηm.requestStatsFactory();
  83. this.off = false;
  84. this.init(tabContext);
  85. };
  86. PageStore.prototype = {
  87. collapsibleTypes: new Set([ 'image' ]),
  88. pageStoreJunkyard: [],
  89. init: function(tabContext) {
  90. this.tabId = tabContext.tabId;
  91. this.rawUrl = tabContext.rawURL;
  92. this.pageUrl = tabContext.normalURL;
  93. this.pageHostname = tabContext.rootHostname;
  94. this.pageDomain = tabContext.rootDomain;
  95. this.title = '';
  96. this.hostnameTypeCells.clear();
  97. this.domains.clear();
  98. this.allHostnamesString = ' ';
  99. this.blockedCollapsibles.reset();
  100. this.requestStats.reset();
  101. this.distinctRequestCount = 0;
  102. this.perLoadAllowedRequestCount = 0;
  103. this.perLoadBlockedRequestCount = 0;
  104. this.has3pReferrer = false;
  105. this.hasMixedContent = false;
  106. this.hasNoscriptTags = false;
  107. this.hasWebWorkers = false;
  108. this.incinerationTimer = null;
  109. this.mtxContentModifiedTime = 0;
  110. this.mtxCountModifiedTime = 0;
  111. return this;
  112. },
  113. dispose: function() {
  114. this.rawUrl = '';
  115. this.pageUrl = '';
  116. this.pageHostname = '';
  117. this.pageDomain = '';
  118. this.title = '';
  119. this.hostnameTypeCells.clear();
  120. this.domains.clear();
  121. this.allHostnamesString = ' ';
  122. this.blockedCollapsibles.reset();
  123. if ( this.incinerationTimer !== null ) {
  124. clearTimeout(this.incinerationTimer);
  125. this.incinerationTimer = null;
  126. }
  127. if ( this.pageStoreJunkyard.length < 8 ) {
  128. this.pageStoreJunkyard.push(this);
  129. }
  130. },
  131. cacheBlockedCollapsible: function(type, url, specificity) {
  132. if ( this.collapsibleTypes.has(type) ) {
  133. this.blockedCollapsibles.add(
  134. type,
  135. url,
  136. specificity !== 0 && specificity < 5
  137. );
  138. }
  139. },
  140. lookupBlockedCollapsibles: function(request, response) {
  141. var tabContext = ηm.tabContextManager.lookup(this.tabId);
  142. if ( tabContext === null ) { return; }
  143. var collapseBlacklisted = ηm.userSettings.collapseBlacklisted,
  144. collapseBlocked = ηm.userSettings.collapseBlocked,
  145. entry;
  146. var blockedResources = response.blockedResources;
  147. if (
  148. Array.isArray(request.toFilter) &&
  149. request.toFilter.length !== 0
  150. ) {
  151. var roothn = tabContext.rootHostname,
  152. hnFromURI = ηm.URI.hostnameFromURI,
  153. tMatrix = ηm.tMatrix;
  154. for ( entry of request.toFilter ) {
  155. if ( tMatrix.mustBlock(roothn, hnFromURI(entry.url), entry.type) === false ) {
  156. continue;
  157. }
  158. blockedResources.push([
  159. entry.type + ' ' + entry.url,
  160. collapseBlocked ||
  161. collapseBlacklisted && tMatrix.specificityRegister !== 0 &&
  162. tMatrix.specificityRegister < 5
  163. ]);
  164. }
  165. }
  166. if ( this.blockedCollapsibles.hash === response.hash ) { return; }
  167. response.hash = this.blockedCollapsibles.hash;
  168. for ( entry of this.blockedCollapsibles.blocked ) {
  169. blockedResources.push([
  170. entry[0],
  171. collapseBlocked || collapseBlacklisted && (entry[1] & 1) !== 0
  172. ]);
  173. }
  174. },
  175. recordRequest: function(type, url, block) {
  176. if ( block !== false ) {
  177. this.perLoadBlockedRequestCount++;
  178. } else {
  179. this.perLoadAllowedRequestCount++;
  180. }
  181. // Store distinct network requests. This is used to:
  182. // - remember which hostname/type were seen
  183. // - count the number of distinct URLs for any given
  184. // hostname-type pair
  185. var hostname = ηm.URI.hostnameFromURI(url),
  186. key = hostname + ' ' + type,
  187. uids = this.hostnameTypeCells.get(key);
  188. if ( uids === undefined ) {
  189. this.hostnameTypeCells.set(key, (uids = new Set()));
  190. } else if ( uids.size > 99 ) {
  191. return;
  192. }
  193. var uid = this.uidFromURL(url);
  194. if ( uids.has(uid) ) { return; }
  195. uids.add(uid);
  196. // Count blocked/allowed requests
  197. this.requestStats.record(type, block);
  198. // https://github.com/gorhill/httpswitchboard/issues/306
  199. // If it is recorded locally, record globally
  200. ηm.requestStats.record(type, block);
  201. ηm.updateBadgeAsync(this.tabId);
  202. // this.distinctRequestCount++;
  203. this.mtxCountModifiedTime = Date.now();
  204. if ( this.domains.has(hostname) === false ) {
  205. this.domains.add(hostname);
  206. this.allHostnamesString += hostname + ' ';
  207. this.mtxContentModifiedTime = Date.now();
  208. }
  209. },
  210. uidFromURL: function(uri) {
  211. var hint = 0x811c9dc5,
  212. i = uri.length;
  213. while ( i-- ) {
  214. hint ^= uri.charCodeAt(i) | 0;
  215. hint += (hint<<1) + (hint<<4) + (hint<<7) + (hint<<8) + (hint<<24) | 0;
  216. hint >>>= 0;
  217. }
  218. return hint;
  219. }
  220. };
  221. /******************************************************************************/
  222. return function pageStoreFactory(tabContext) {
  223. var entry = PageStore.prototype.pageStoreJunkyard.pop();
  224. if ( entry ) {
  225. return entry.init(tabContext);
  226. }
  227. return new PageStore(tabContext);
  228. };
  229. /******************************************************************************/
  230. })();
  231. /******************************************************************************/