pypa · pradyunsg · Jun 29, 2020 · May 23, 2020 · May 23, 2020 · Jun 18, 2020
diff --git a/news/8128.feature b/news/8128.feature
@@ -0,0 +1 @@
+Warn if a package URL is a VCS URL or an archive URL with an invalid scheme.
diff --git a/src/pip/_internal/index/collector.py b/src/pip/_internal/index/collector.py
@@ -434,7 +434,8 @@ def _get_html_page(link, session=None):
     # Check for VCS schemes that do not support lookup as web pages.
     vcs_scheme = _match_vcs_scheme(url)
     if vcs_scheme:
-        logger.debug('Cannot look at %s URL %s', vcs_scheme, link)
+        logger.warning('Cannot look at %s URL %s because it does not support '
+                       'lookup as web pages.', vcs_scheme, link)
         return None
 
     # Tack index.html onto file:// URLs that point to directories
@@ -450,7 +451,7 @@ def _get_html_page(link, session=None):
     try:
         resp = _get_html_response(url, session=session)
     except _NotHTTP:
-        logger.debug(
+        logger.warning(
             'Skipping page %s because it looks like an archive, and cannot '
             'be checked by HEAD.', link,
         )

diff --git a/tests/unit/test_collector.py b/tests/unit/test_collector.py
@@ -74,6 +74,31 @@ def test_get_html_response_archive_to_http_scheme(url, content_type):
     assert ctx.value.args == (content_type, "HEAD")
 
 
+@pytest.mark.parametrize(
+    "url",
+    [
+        ("ftp://python.org/python-3.7.1.zip"),
+        ("file:///opt/data/pip-18.0.tar.gz"),
+    ],
+)
+def test_get_html_page_invalid_content_type_archive(caplog, url):
+    """`_get_html_page()` should warn if an archive URL is not HTML
+    and therefore cannot be used for a HEAD request.
+    """
+    caplog.set_level(logging.WARNING)
+    link = Link(url)
+
+    session = mock.Mock(PipSession)
+
+    assert _get_html_page(link, session=session) is None
+    assert ('pip._internal.index.collector',
+            logging.WARNING,
+            'Skipping page {} because it looks like an archive, and cannot '
+            'be checked by HEAD.'.format(
+                url)) \
+        in caplog.record_tuples
+
+
 @pytest.mark.parametrize(
     "url",
     [
@@ -463,15 +488,16 @@ def test_get_html_page_invalid_scheme(caplog, url, vcs_scheme):
 
     Only file:, http:, https:, and ftp: are allowed.
     """
-    with caplog.at_level(logging.DEBUG):
+    with caplog.at_level(logging.WARNING):
         page = _get_html_page(Link(url), session=mock.Mock(PipSession))
 
     assert page is None
     assert caplog.record_tuples == [
         (
             "pip._internal.index.collector",
-            logging.DEBUG,
-            "Cannot look at {} URL {}".format(vcs_scheme, url),
+            logging.WARNING,
+            "Cannot look at {} URL {} because it does not support "
+            "lookup as web pages.".format(vcs_scheme, url),
         ),
     ]
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1 @@
		Warn if a package URL is a VCS URL or an archive URL with an invalid scheme.