package/package.json000644 0000001426 13220203761011564 0ustar00000000 000000 { "name": "normalize-url", "version": "2.0.1", "description": "Normalize a URL", "license": "MIT", "repository": "sindresorhus/normalize-url", "author": { "name": "Sindre Sorhus", "email": "sindresorhus@gmail.com", "url": "sindresorhus.com" }, "engines": { "node": ">=4" }, "scripts": { "test": "xo && ava" }, "files": [ "index.js" ], "keywords": [ "normalize", "url", "uri", "address", "string", "normalization", "normalisation", "query", "querystring", "unicode", "simplify", "strip", "trim", "canonical" ], "dependencies": { "prepend-http": "^2.0.0", "query-string": "^5.0.1", "sort-keys": "^2.0.0" }, "devDependencies": { "ava": "*", "xo": "*" } } package/index.js000644 0000007626 13220203636010754 0ustar00000000 000000 'use strict'; const url = require('url'); const punycode = require('punycode'); const queryString = require('query-string'); const prependHttp = require('prepend-http'); const sortKeys = require('sort-keys'); const DEFAULT_PORTS = { 'http:': 80, 'https:': 443, 'ftp:': 21 }; // Protocols that always contain a `//`` bit const slashedProtocol = { http: true, https: true, ftp: true, gopher: true, file: true, 'http:': true, 'https:': true, 'ftp:': true, 'gopher:': true, 'file:': true }; function testParameter(name, filters) { return filters.some(filter => filter instanceof RegExp ? 
filter.test(name) : filter === name); } module.exports = (str, opts) => { opts = Object.assign({ normalizeProtocol: true, normalizeHttps: false, stripFragment: true, stripWWW: true, removeQueryParameters: [/^utm_\w+/i], removeTrailingSlash: true, removeDirectoryIndex: false, sortQueryParameters: true }, opts); if (typeof str !== 'string') { throw new TypeError('Expected a string'); } const hasRelativeProtocol = str.startsWith('//'); // Prepend protocol str = prependHttp(str.trim()).replace(/^\/\//, 'http://'); const urlObj = url.parse(str); if (opts.normalizeHttps && urlObj.protocol === 'https:') { urlObj.protocol = 'http:'; } if (!urlObj.hostname && !urlObj.pathname) { throw new Error('Invalid URL'); } // Prevent these from being used by `url.format` delete urlObj.host; delete urlObj.query; // Remove fragment if (opts.stripFragment) { delete urlObj.hash; } // Remove default port const port = DEFAULT_PORTS[urlObj.protocol]; if (Number(urlObj.port) === port) { delete urlObj.port; } // Remove duplicate slashes if (urlObj.pathname) { urlObj.pathname = urlObj.pathname.replace(/\/{2,}/g, '/'); } // Decode URI octets if (urlObj.pathname) { urlObj.pathname = decodeURI(urlObj.pathname); } // Remove directory index if (opts.removeDirectoryIndex === true) { opts.removeDirectoryIndex = [/^index\.[a-z]+$/]; } if (Array.isArray(opts.removeDirectoryIndex) && opts.removeDirectoryIndex.length > 0) { let pathComponents = urlObj.pathname.split('/'); const lastComponent = pathComponents[pathComponents.length - 1]; if (testParameter(lastComponent, opts.removeDirectoryIndex)) { pathComponents = pathComponents.slice(0, pathComponents.length - 1); urlObj.pathname = pathComponents.slice(1).join('/') + '/'; } } // Resolve relative paths, but only for slashed protocols if (slashedProtocol[urlObj.protocol]) { const domain = urlObj.protocol + '//' + urlObj.hostname; const relative = url.resolve(domain, urlObj.pathname); urlObj.pathname = relative.replace(domain, ''); } if (urlObj.hostname) { 
// IDN to Unicode urlObj.hostname = punycode.toUnicode(urlObj.hostname).toLowerCase(); // Remove trailing dot urlObj.hostname = urlObj.hostname.replace(/\.$/, ''); // Remove `www.` if (opts.stripWWW) { urlObj.hostname = urlObj.hostname.replace(/^www\./, ''); } } // Remove URL with empty query string if (urlObj.search === '?') { delete urlObj.search; } const queryParameters = queryString.parse(urlObj.search); // Remove query unwanted parameters if (Array.isArray(opts.removeQueryParameters)) { for (const key in queryParameters) { if (testParameter(key, opts.removeQueryParameters)) { delete queryParameters[key]; } } } // Sort query parameters if (opts.sortQueryParameters) { urlObj.search = queryString.stringify(sortKeys(queryParameters)); } // Decode query parameters if (urlObj.search !== null) { urlObj.search = decodeURIComponent(urlObj.search); } // Take advantage of many of the Node `url` normalizations str = url.format(urlObj); // Remove ending `/` if (opts.removeTrailingSlash || urlObj.pathname === '/') { str = str.replace(/\/$/, ''); } // Restore relative protocol, if applicable if (hasRelativeProtocol && !opts.normalizeProtocol) { str = str.replace(/^http:\/\//, '//'); } return str; }; package/license000644 0000002125 13114064117010642 0ustar00000000 000000 MIT License Copyright (c) Sindre Sorhus (sindresorhus.com) Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. 
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. package/readme.md000644 0000007046 13210073373011064 0ustar00000000 000000 # normalize-url [![Build Status](https://travis-ci.org/sindresorhus/normalize-url.svg?branch=master)](https://travis-ci.org/sindresorhus/normalize-url) > [Normalize](https://en.wikipedia.org/wiki/URL_normalization) a URL Useful when you need to display, store, deduplicate, sort, compare, etc, URLs. ## Install ``` $ npm install normalize-url ``` ## Usage ```js const normalizeUrl = require('normalize-url'); normalizeUrl('sindresorhus.com'); //=> 'http://sindresorhus.com' normalizeUrl('HTTP://xn--xample-hva.com:80/?b=bar&a=foo'); //=> 'http://êxample.com/?a=foo&b=bar' ``` ## API ### normalizeUrl(url, [options]) #### url Type: `string` URL to normalize. #### options Type: `Object` ##### normalizeProtocol Type: `boolean`
Default: `true` Prepend `http:` to the URL if it's protocol-relative. ```js normalizeUrl('//sindresorhus.com:80/'); //=> 'http://sindresorhus.com' normalizeUrl('//sindresorhus.com:80/', {normalizeProtocol: false}); //=> '//sindresorhus.com' ``` ##### normalizeHttps Type: `boolean`
Default: `false` Normalize `https:` URLs to `http:`. ```js normalizeUrl('https://sindresorhus.com:80/'); //=> 'https://sindresorhus.com:80' normalizeUrl('https://sindresorhus.com:80/', {normalizeHttps: true}); //=> 'http://sindresorhus.com' ``` ##### stripFragment Type: `boolean`
Default: `true` Remove the fragment at the end of the URL. ```js normalizeUrl('sindresorhus.com/about.html#contact'); //=> 'http://sindresorhus.com/about.html' normalizeUrl('sindresorhus.com/about.html#contact', {stripFragment: false}); //=> 'http://sindresorhus.com/about.html#contact' ``` ##### stripWWW Type: `boolean`
Default: `true` Remove `www.` from the URL. ```js normalizeUrl('http://www.sindresorhus.com/about.html#contact'); //=> 'http://sindresorhus.com/about.html' normalizeUrl('http://www.sindresorhus.com/about.html#contact', {stripWWW: false}); //=> 'http://www.sindresorhus.com/about.html' ``` ##### removeQueryParameters Type: `Array<RegExp|string>`
Default: `[/^utm_\w+/i]` Remove query parameters that match any of the provided strings or regexes. ```js normalizeUrl('www.sindresorhus.com?foo=bar&ref=test_ref', { removeQueryParameters: ['ref'] }); //=> 'http://sindresorhus.com/?foo=bar' ``` ##### removeTrailingSlash Type: `boolean`
Default: `true` Remove trailing slash. **Note:** Trailing slash is always removed if the URL doesn't have a pathname. ```js normalizeUrl('http://sindresorhus.com/redirect/'); //=> 'http://sindresorhus.com/redirect' normalizeUrl('http://sindresorhus.com/redirect/', {removeTrailingSlash: false}); //=> 'http://sindresorhus.com/redirect/' normalizeUrl('http://sindresorhus.com/', {removeTrailingSlash: false}); //=> 'http://sindresorhus.com' ``` ##### removeDirectoryIndex Type: `boolean` `Array<RegExp|string>`
Default: `false` Remove the default directory index file from the path if it matches any of the provided strings or regexes. When `true`, the regex `/^index\.[a-z]+$/` is used. ```js normalizeUrl('www.sindresorhus.com/foo/default.php', { removeDirectoryIndex: [/^default\.[a-z]+$/] }); //=> 'http://sindresorhus.com/foo' ``` ##### sortQueryParameters Type: `boolean`
Default: `true` Sort the query parameters alphabetically by key. ```js normalizeUrl('www.sindresorhus.com?b=two&a=one&c=three', { sortQueryParameters: false }); //=> 'http://sindresorhus.com/?b=two&a=one&c=three' ``` ## Related - [compare-urls](https://github.com/sindresorhus/compare-urls) - Compare URLs by first normalizing them ## License MIT © [Sindre Sorhus](https://sindresorhus.com)