Skip to content

Commit

Permalink
Redact basic authentication passwords from log messages (#5773)
Browse files Browse the repository at this point in the history
Redact basic authentication passwords from URLs.
  • Loading branch information
orf authored and cjerdonek committed Oct 19, 2018
1 parent c30b10a commit 78371cc
Show file tree
Hide file tree
Showing 8 changed files with 84 additions and 21 deletions.
1 change: 1 addition & 0 deletions news/4746.bugfix
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
Redact the password from the URL in various log messages.
6 changes: 3 additions & 3 deletions src/pip/_internal/index.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@
from pip._internal.utils.logging import indent_log
from pip._internal.utils.misc import (
ARCHIVE_EXTENSIONS, SUPPORTED_EXTENSIONS, normalize_path,
remove_auth_from_url,
redact_password_from_url,
)
from pip._internal.utils.packaging import check_requires_python
from pip._internal.wheel import Wheel, wheel_ext
Expand Down Expand Up @@ -326,7 +326,7 @@ def get_formatted_locations(self):
if self.index_urls and self.index_urls != [PyPI.simple_url]:
lines.append(
"Looking in indexes: {}".format(", ".join(
remove_auth_from_url(url) for url in self.index_urls))
redact_password_from_url(url) for url in self.index_urls))
)
if self.find_links:
lines.append(
Expand Down Expand Up @@ -923,7 +923,7 @@ def __init__(self, content, url, headers=None):
self.headers = headers

def __str__(self):
return self.url
return redact_password_from_url(self.url)

def iter_links(self):
"""Yields all links in the page"""
Expand Down
7 changes: 4 additions & 3 deletions src/pip/_internal/models/link.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
from pip._vendor.six.moves.urllib import parse as urllib_parse

from pip._internal.download import path_to_url
from pip._internal.utils.misc import splitext
from pip._internal.utils.misc import redact_password_from_url, splitext
from pip._internal.utils.models import KeyBasedCompareMixin
from pip._internal.wheel import wheel_ext

Expand Down Expand Up @@ -44,9 +44,10 @@ def __str__(self):
else:
rp = ''
if self.comes_from:
return '%s (from %s)%s' % (self.url, self.comes_from, rp)
return '%s (from %s)%s' % (redact_password_from_url(self.url),
self.comes_from, rp)
else:
return str(self.url)
return redact_password_from_url(str(self.url))

def __repr__(self):
return '<Link %s>' % self
Expand Down
6 changes: 3 additions & 3 deletions src/pip/_internal/req/req_install.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@
from pip._internal.utils.misc import (
_make_build_dir, ask_path_exists, backup_dir, call_subprocess,
display_path, dist_in_site_packages, dist_in_usersite, ensure_dir,
get_installed_version, rmtree,
get_installed_version, redact_password_from_url, rmtree,
)
from pip._internal.utils.packaging import get_metadata
from pip._internal.utils.setuptools_build import SETUPTOOLS_SHIM
Expand Down Expand Up @@ -128,9 +128,9 @@ def __str__(self):
if self.req:
s = str(self.req)
if self.link:
s += ' from %s' % self.link.url
s += ' from %s' % redact_password_from_url(self.link.url)
elif self.link:
s = self.link.url
s = redact_password_from_url(self.link.url)
else:
s = '<InstallRequirement>'
if self.satisfied_by is not None:
Expand Down
39 changes: 32 additions & 7 deletions src/pip/_internal/utils/misc.py
Original file line number Diff line number Diff line change
Expand Up @@ -890,15 +890,24 @@ def split_auth_from_netloc(netloc):
return netloc, user_pass


def remove_auth_from_url(url):
# Return a copy of url with 'username:password@' removed.
# username/pass params are passed to subversion through flags
# and are not recognized in the url.
def redact_netloc(netloc):
"""
Replace the password in a netloc with "****", if it exists.
For example, "user:[email protected]" returns "user:****@example.com".
"""
netloc, (user, password) = split_auth_from_netloc(netloc)
if user is None:
return netloc
password = '' if password is None else ':****'
return '{user}{password}@{netloc}'.format(user=user,
password=password,
netloc=netloc)

# parsed url
purl = urllib_parse.urlsplit(url)
netloc, user_pass = split_auth_from_netloc(purl.netloc)

def _transform_url(url, transform_netloc):
purl = urllib_parse.urlsplit(url)
netloc = transform_netloc(purl.netloc)
# stripped url
url_pieces = (
purl.scheme, netloc, purl.path, purl.query, purl.fragment
Expand All @@ -907,6 +916,22 @@ def remove_auth_from_url(url):
return surl


def _get_netloc(netloc):
return split_auth_from_netloc(netloc)[0]


def remove_auth_from_url(url):
# Return a copy of url with 'username:password@' removed.
# username/pass params are passed to subversion through flags
# and are not recognized in the url.
return _transform_url(url, _get_netloc)


def redact_password_from_url(url):
"""Replace the password in a given url with ****."""
return _transform_url(url, redact_netloc)


def protect_pip_from_modification_on_windows(modifying_pip):
"""Protection of pip.exe from modification on Windows
Expand Down
7 changes: 5 additions & 2 deletions src/pip/_internal/vcs/git.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,9 @@

from pip._internal.exceptions import BadCommand
from pip._internal.utils.compat import samefile
from pip._internal.utils.misc import display_path, make_vcs_requirement_url
from pip._internal.utils.misc import (
display_path, make_vcs_requirement_url, redact_password_from_url,
)
from pip._internal.utils.temp_dir import TempDirectory
from pip._internal.vcs import VersionControl, vcs

Expand Down Expand Up @@ -193,7 +195,8 @@ def is_commit_id_equal(self, dest, name):
def fetch_new(self, dest, url, rev_options):
rev_display = rev_options.to_display()
logger.info(
'Cloning %s%s to %s', url, rev_display, display_path(dest),
'Cloning %s%s to %s', redact_password_from_url(url),
rev_display, display_path(dest),
)
self.run_command(['clone', '-q', url, dest])

Expand Down
4 changes: 3 additions & 1 deletion tests/unit/test_index.py
Original file line number Diff line number Diff line change
Expand Up @@ -161,7 +161,9 @@ def test_get_formatted_locations_basic_auth():
finder = PackageFinder([], index_urls, session=[])

result = finder.get_formatted_locations()
assert 'user' not in result and 'pass' not in result
assert 'user' in result
assert '****' in result
assert 'pass' not in result


@pytest.mark.parametrize(
Expand Down
35 changes: 33 additions & 2 deletions tests/unit/test_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,8 +24,9 @@
from pip._internal.utils.hashes import Hashes, MissingHashes
from pip._internal.utils.misc import (
call_subprocess, egg_link_path, ensure_dir, get_installed_distributions,
get_prog, make_vcs_requirement_url, normalize_path, remove_auth_from_url,
rmtree, split_auth_from_netloc, untar_file, unzip_file,
get_prog, make_vcs_requirement_url, normalize_path, redact_netloc,
redact_password_from_url, remove_auth_from_url, rmtree,
split_auth_from_netloc, untar_file, unzip_file,
)
from pip._internal.utils.packaging import check_dist_requires_python
from pip._internal.utils.temp_dir import TempDirectory
Expand Down Expand Up @@ -662,6 +663,25 @@ def test_split_auth_from_netloc(netloc, expected):
assert actual == expected


@pytest.mark.parametrize('netloc, expected', [
# Test a basic case.
('example.com', 'example.com'),
# Test with username and no password.
('[email protected]', '[email protected]'),
# Test with username and password.
('user:[email protected]', 'user:****@example.com'),
# Test with username and empty password.
('user:@example.com', 'user:****@example.com'),
# Test the password containing an @ symbol.
('user:pass@[email protected]', 'user:****@example.com'),
# Test the password containing a : symbol.
('user:pass:[email protected]', 'user:****@example.com'),
])
def test_redact_netloc(netloc, expected):
actual = redact_netloc(netloc)
assert actual == expected


@pytest.mark.parametrize('auth_url, expected_url', [
('https://user:[email protected]/project/tags/v0.2',
'https://domain.tld/project/tags/v0.2'),
Expand All @@ -681,3 +701,14 @@ def test_split_auth_from_netloc(netloc, expected):
def test_remove_auth_from_url(auth_url, expected_url):
url = remove_auth_from_url(auth_url)
assert url == expected_url


@pytest.mark.parametrize('auth_url, expected_url', [
('https://[email protected]/abc', 'https://[email protected]/abc'),
('https://user:[email protected]', 'https://user:****@example.com'),
('https://user:@example.com', 'https://user:****@example.com'),
('https://example.com', 'https://example.com')
])
def test_redact_password_from_url(auth_url, expected_url):
url = redact_password_from_url(auth_url)
assert url == expected_url

0 comments on commit 78371cc

Please sign in to comment.