TemEx: Template Extractor

TemEx: Template Extractor

This tool automatically extracts the template of a webpage. To identify the template, the tool (1) analyzes the webpages linked from the current webpage, and (2) identifies the HTML structures that those pages have in common. These common HTML structures constitute the template.

Merlin
Additional files are visible only to premium users

manifest.json


{
  "manifest_version": 2,
  "name": "__MSG_extensionName__",
  "description": "__MSG_extensionDescription__",
  "version": "1.8.1",
  "author": "Julián",
  "default_locale": "en",
  "icons": { "24": "icons/t3.png" },
  "permissions": ["notifications", "activeTab", "tabs", "webRequest", "webRequestBlocking"],
  "background": {
    "scripts": ["background-scripts/background.js"]
  },
  "browser_action": {
    "default_title": "__MSG_extensionDescription__",
    "default_icon": "icons/t3.png"
  },
  "content_scripts": [
    {
      "matches": ["<all_urls>"],
      "all_frames": false,
      "run_at": "document_idle",
      "js": [
        "content-scripts/createNamespaces.js",
        "content-scripts/TemEx/loader/PageLoader.js",
        "content-scripts/TemEx/util/Hashtable.js",
        "content-scripts/TemEx/util/TreeSearch.js",
        "content-scripts/TemEx/misc/Misc.js",
        "content-scripts/TemEx/site/Link.js",
        "content-scripts/TemEx/site/Webpage.js",
        "content-scripts/TemEx/site/Website.js",
        "content-scripts/TemEx/algorithm/TemEx/Config.js",
        "content-scripts/TemEx/algorithm/TemEx/HierarchyLinks.js",
        "content-scripts/TemEx/algorithm/TemEx/Map.js",
        "content-scripts/TemEx/algorithm/TemEx/TemEx.js",
        "content-scripts/TemEx/TemplateExtractor.js",
        "content-scripts/browserOverlay.js"
      ]
    }
  ]
}