# vim: ft=python fileencoding=utf-8 sts=4 sw=4 et: # Copyright 2014-2016 Florian Bruhin (The Compiler) # # This file is part of qutebrowser. # # qutebrowser is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # qutebrowser is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with qutebrowser. If not, see . """Tests for qutebrowser.utils.urlutils.""" import os.path import collections from PyQt5.QtCore import QUrl import pytest from qutebrowser.commands import cmdexc from qutebrowser.utils import utils, urlutils, qtutils class FakeDNS: """Helper class for the fake_dns fixture. Class attributes: FakeDNSAnswer: Helper class/namedtuple imitating a QHostInfo object (used by fromname_mock). Attributes: used: Whether the fake DNS server was used since it was created/reset. answer: What to return for the given host(True/False). Needs to be set when fromname_mock is called. """ FakeDNSAnswer = collections.namedtuple('FakeDNSAnswer', ['error']) def __init__(self): self.used = False self.answer = None def __repr__(self): return utils.get_repr(self, used=self.used, answer=self.answer) def reset(self): """Reset used/answer as if the FakeDNS was freshly created.""" self.used = False self.answer = None def _get_error(self): return not self.answer def fromname_mock(self, _host): """Simple mock for QHostInfo::fromName returning a FakeDNSAnswer.""" if self.answer is None: raise ValueError("Got called without answer being set. This means " "something tried to make an unexpected DNS " "request (QHostInfo::fromName).") if self.used: raise ValueError("Got used twice!.") self.used = True return self.FakeDNSAnswer(error=self._get_error) @pytest.fixture(autouse=True) def fake_dns(monkeypatch): """Patched QHostInfo.fromName to catch DNS requests. With autouse=True so accidental DNS requests get discovered because the fromname_mock will be called without answer being set. """ dns = FakeDNS() monkeypatch.setattr('qutebrowser.utils.urlutils.QHostInfo.fromName', dns.fromname_mock) return dns @pytest.fixture(autouse=True) def urlutils_config_stub(config_stub, monkeypatch): """Initialize the given config_stub. Args: stub: The ConfigStub provided by the config_stub fixture. auto_search: The value auto-search should have. """ config_stub.data = { 'general': {'auto-search': True}, 'searchengines': { 'test': 'http://www.qutebrowser.org/?q={}', 'test-with-dash': 'http://www.example.org/?q={}', 'DEFAULT': 'http://www.example.com/?q={}', }, } monkeypatch.setattr('qutebrowser.utils.urlutils.config', config_stub) return config_stub @pytest.fixture def urlutils_message_mock(message_mock): """Customized message_mock for the urlutils module.""" message_mock.patch('qutebrowser.utils.urlutils.message') return message_mock class TestFuzzyUrl: """Tests for urlutils.fuzzy_url().""" @pytest.fixture def os_mock(self, mocker): """Mock the os module and some os.path functions.""" m = mocker.patch('qutebrowser.utils.urlutils.os') # Using / to get the same behavior across OS' m.path.join.side_effect = lambda *args: '/'.join(args) m.path.expanduser.side_effect = os.path.expanduser return m @pytest.fixture def is_url_mock(self, mocker): return mocker.patch('qutebrowser.utils.urlutils.is_url') @pytest.fixture def get_search_url_mock(self, mocker): return mocker.patch('qutebrowser.utils.urlutils._get_search_url') def test_file_relative_cwd(self, os_mock): """Test with relative=True, cwd set, and an existing file.""" os_mock.path.exists.return_value = True os_mock.path.isabs.return_value = False url = urlutils.fuzzy_url('foo', cwd='cwd', relative=True) os_mock.path.exists.assert_called_once_with('cwd/foo') assert url == QUrl('file:cwd/foo') def test_file_relative(self, os_mock): """Test with relative=True and cwd unset.""" os_mock.path.exists.return_value = True os_mock.path.abspath.return_value = 'abs_path' os_mock.path.isabs.return_value = False url = urlutils.fuzzy_url('foo', relative=True) os_mock.path.exists.assert_called_once_with('abs_path') assert url == QUrl('file:abs_path') def test_file_relative_os_error(self, os_mock, is_url_mock): """Test with relative=True, cwd unset and abspath raising OSError.""" os_mock.path.abspath.side_effect = OSError os_mock.path.exists.return_value = True os_mock.path.isabs.return_value = False is_url_mock.return_value = True url = urlutils.fuzzy_url('foo', relative=True) assert not os_mock.path.exists.called assert url == QUrl('http://foo') @pytest.mark.parametrize('path, expected', [ ('/foo', QUrl('file:///foo')), ('/bar\n', QUrl('file:///bar')), ]) def test_file_absolute(self, path, expected, os_mock): """Test with an absolute path.""" os_mock.path.exists.return_value = True os_mock.path.isabs.return_value = True url = urlutils.fuzzy_url(path) assert url == expected @pytest.mark.posix def test_file_absolute_expanded(self, os_mock): """Make sure ~ gets expanded correctly.""" os_mock.path.exists.return_value = True os_mock.path.isabs.return_value = True url = urlutils.fuzzy_url('~/foo') assert url == QUrl('file://' + os.path.expanduser('~/foo')) def test_address(self, os_mock, is_url_mock): """Test passing something with relative=False.""" os_mock.path.isabs.return_value = False is_url_mock.return_value = True url = urlutils.fuzzy_url('foo') assert url == QUrl('http://foo') def test_search_term(self, os_mock, is_url_mock, get_search_url_mock): """Test passing something with do_search=True.""" os_mock.path.isabs.return_value = False is_url_mock.return_value = False get_search_url_mock.return_value = QUrl('search_url') url = urlutils.fuzzy_url('foo', do_search=True) assert url == QUrl('search_url') def test_search_term_value_error(self, os_mock, is_url_mock, get_search_url_mock): """Test with do_search=True and ValueError in _get_search_url.""" os_mock.path.isabs.return_value = False is_url_mock.return_value = False get_search_url_mock.side_effect = ValueError url = urlutils.fuzzy_url('foo', do_search=True) assert url == QUrl('http://foo') def test_no_do_search(self, is_url_mock): """Test with do_search = False.""" is_url_mock.return_value = False url = urlutils.fuzzy_url('foo', do_search=False) assert url == QUrl('http://foo') @pytest.mark.parametrize('do_search, exception', [ (True, qtutils.QtValueError), (False, urlutils.InvalidUrlError), ]) def test_invalid_url(self, do_search, exception, is_url_mock, monkeypatch): """Test with an invalid URL.""" is_url_mock.return_value = True monkeypatch.setattr('qutebrowser.utils.urlutils.qurl_from_user_input', lambda url: QUrl()) with pytest.raises(exception): urlutils.fuzzy_url('foo', do_search=do_search) @pytest.mark.parametrize('url', ['', ' ']) def test_empty(self, url): with pytest.raises(urlutils.InvalidUrlError): urlutils.fuzzy_url(url, do_search=True) @pytest.mark.parametrize('urlstring', [ 'http://www.qutebrowser.org/', '/foo', 'test' ]) def test_force_search(self, urlstring, get_search_url_mock): """Test the force search option.""" get_search_url_mock.return_value = QUrl('search_url') url = urlutils.fuzzy_url(urlstring, force_search=True) assert url == QUrl('search_url') @pytest.mark.parametrize('path, check_exists', [ ('/foo', False), ('/bar', True), ]) def test_get_path_existing(self, path, check_exists, os_mock): """Test with an absolute path.""" os_mock.path.exists.return_value = False expected = None if check_exists else path url = urlutils.get_path_if_valid(path, check_exists=check_exists) assert url == expected @pytest.mark.parametrize('url, special', [ ('file:///tmp/foo', True), ('about:blank', True), ('qute:version', True), ('http://www.qutebrowser.org/', False), ('www.qutebrowser.org', False), ]) def test_special_urls(url, special): assert urlutils.is_special_url(QUrl(url)) == special @pytest.mark.parametrize('url, host, query', [ ('testfoo', 'www.example.com', 'q=testfoo'), ('test testfoo', 'www.qutebrowser.org', 'q=testfoo'), ('test testfoo bar foo', 'www.qutebrowser.org', 'q=testfoo bar foo'), ('test testfoo ', 'www.qutebrowser.org', 'q=testfoo'), ('!python testfoo', 'www.example.com', 'q=%21python testfoo'), ('blub testfoo', 'www.example.com', 'q=blub testfoo'), ('stripped ', 'www.example.com', 'q=stripped'), ('test-with-dash testfoo', 'www.example.org', 'q=testfoo'), ]) def test_get_search_url(urlutils_config_stub, url, host, query): """Test _get_search_url(). Args: url: The "URL" to enter. host: The expected search machine host. query: The expected search query. """ url = urlutils._get_search_url(url) assert url.host() == host assert url.query() == query @pytest.mark.parametrize('url', ['\n', ' ', '\n ']) def test_get_search_url_invalid(urlutils_config_stub, url): with pytest.raises(ValueError): urlutils._get_search_url(url) @pytest.mark.parametrize('is_url, is_url_no_autosearch, uses_dns, url', [ # Normal hosts (True, True, False, 'http://foobar'), (True, True, False, 'localhost:8080'), (True, True, True, 'qutebrowser.org'), (True, True, True, ' qutebrowser.org '), (True, True, False, 'http://user:password@example.com/foo?bar=baz#fish'), # IPs (True, True, False, '127.0.0.1'), (True, True, False, '::1'), (True, True, True, '2001:41d0:2:6c11::1'), (True, True, True, '94.23.233.17'), # Special URLs (True, True, False, 'file:///tmp/foo'), (True, True, False, 'about:blank'), (True, True, False, 'qute:version'), (True, True, False, 'localhost'), # _has_explicit_scheme False, special_url True (True, True, False, 'qute::foo'), # Invalid URLs (False, False, False, ''), (False, True, False, 'onlyscheme:'), (False, True, False, 'http:foo:0'), # Not URLs (False, True, False, 'foo bar'), # no DNS because of space (False, True, False, 'localhost test'), # no DNS because of space (False, True, False, 'another . test'), # no DNS because of space (False, True, True, 'foo'), (False, True, False, 'this is: not an URL'), # no DNS because of space (False, True, False, '23.42'), # no DNS because bogus-IP (False, True, False, '1337'), # no DNS because bogus-IP (False, True, True, 'deadbeef'), (False, True, False, '31c3'), # no DNS because bogus-IP (False, True, False, 'foo::bar'), # no DNS because of no host # Valid search term with autosearch (False, False, False, 'test foo'), # autosearch = False (False, True, False, 'This is an URL without autosearch'), ]) def test_is_url(urlutils_config_stub, fake_dns, is_url, is_url_no_autosearch, uses_dns, url): """Test is_url(). Args: is_url: Whether the given string is an URL with auto-search dns/naive. is_url_no_autosearch: Whether the given string is an URL with auto-search false. uses_dns: Whether the given string should fire a DNS request for the given URL. url: The URL to test, as a string. """ urlutils_config_stub.data['general']['auto-search'] = 'dns' if uses_dns: fake_dns.answer = True result = urlutils.is_url(url) assert fake_dns.used assert result fake_dns.reset() fake_dns.answer = False result = urlutils.is_url(url) assert fake_dns.used assert not result else: result = urlutils.is_url(url) assert not fake_dns.used assert result == is_url fake_dns.reset() urlutils_config_stub.data['general']['auto-search'] = 'naive' assert urlutils.is_url(url) == is_url assert not fake_dns.used fake_dns.reset() urlutils_config_stub.data['general']['auto-search'] = False assert urlutils.is_url(url) == is_url_no_autosearch assert not fake_dns.used @pytest.mark.parametrize('user_input, output', [ ('qutebrowser.org', 'http://qutebrowser.org'), ('http://qutebrowser.org', 'http://qutebrowser.org'), ('::1/foo', 'http://[::1]/foo'), ('[::1]/foo', 'http://[::1]/foo'), ('http://[::1]', 'http://[::1]'), ('qutebrowser.org', 'http://qutebrowser.org'), ('http://qutebrowser.org', 'http://qutebrowser.org'), ('::1/foo', 'http://[::1]/foo'), ('[::1]/foo', 'http://[::1]/foo'), ('http://[::1]', 'http://[::1]'), ]) def test_qurl_from_user_input(user_input, output): """Test qurl_from_user_input. Args: user_input: The string to pass to qurl_from_user_input. output: The expected QUrl string. """ url = urlutils.qurl_from_user_input(user_input) assert url.toString() == output @pytest.mark.parametrize('url, valid, has_err_string', [ ('http://www.example.com/', True, False), ('', False, False), ('://', False, True), ]) def test_invalid_url_error(urlutils_message_mock, url, valid, has_err_string): """Test invalid_url_error(). Args: url: The URL to check. valid: Whether the QUrl is valid (isValid() == True). has_err_string: Whether the QUrl is expected to have errorString set. """ qurl = QUrl(url) assert qurl.isValid() == valid if valid: with pytest.raises(ValueError): urlutils.invalid_url_error(0, qurl, '') assert not urlutils_message_mock.messages else: assert bool(qurl.errorString()) == has_err_string urlutils.invalid_url_error(0, qurl, 'frozzle') msg = urlutils_message_mock.getmsg(urlutils_message_mock.Level.error) if has_err_string: expected_text = ("Trying to frozzle with invalid URL - " + qurl.errorString()) else: expected_text = "Trying to frozzle with invalid URL" assert msg.text == expected_text @pytest.mark.parametrize('url, valid, has_err_string', [ ('http://www.example.com/', True, False), ('', False, False), ('://', False, True), ]) def test_raise_cmdexc_if_invalid(url, valid, has_err_string): """Test raise_cmdexc_if_invalid. Args: url: The URL to check. valid: Whether the QUrl is valid (isValid() == True). has_err_string: Whether the QUrl is expected to have errorString set. """ qurl = QUrl(url) assert qurl.isValid() == valid if valid: urlutils.raise_cmdexc_if_invalid(qurl) else: assert bool(qurl.errorString()) == has_err_string with pytest.raises(cmdexc.CommandError) as excinfo: urlutils.raise_cmdexc_if_invalid(qurl) if has_err_string: expected_text = "Invalid URL - " + qurl.errorString() else: expected_text = "Invalid URL" assert str(excinfo.value) == expected_text @pytest.mark.parametrize('qurl, output', [ (QUrl(), None), (QUrl('http://qutebrowser.org/test.html'), 'test.html'), (QUrl('http://qutebrowser.org/foo.html#bar'), 'foo.html'), (QUrl('http://user:password@qutebrowser.org/foo?bar=baz#fish'), 'foo'), (QUrl('http://qutebrowser.org/'), 'qutebrowser.org.html'), (QUrl('qute://'), None), ]) def test_filename_from_url(qurl, output): assert urlutils.filename_from_url(qurl) == output @pytest.mark.parametrize('qurl, tpl', [ (QUrl(), None), (QUrl('qute://'), None), (QUrl('qute://foobar'), None), (QUrl('mailto:nobody'), None), (QUrl('ftp://example.com/'), ('ftp', 'example.com', 21)), (QUrl('ftp://example.com:2121/'), ('ftp', 'example.com', 2121)), (QUrl('http://qutebrowser.org:8010/waterfall'), ('http', 'qutebrowser.org', 8010)), (QUrl('https://example.com/'), ('https', 'example.com', 443)), (QUrl('https://example.com:4343/'), ('https', 'example.com', 4343)), (QUrl('http://user:password@qutebrowser.org/foo?bar=baz#fish'), ('http', 'qutebrowser.org', 80)), ]) def test_host_tuple(qurl, tpl): """Test host_tuple(). Args: qurl: The QUrl to pass. tpl: The expected tuple, or None if a ValueError is expected. """ if tpl is None: with pytest.raises(ValueError): urlutils.host_tuple(qurl) else: assert urlutils.host_tuple(qurl) == tpl class TestInvalidUrlError: @pytest.mark.parametrize('url, raising, has_err_string', [ (QUrl(), False, False), (QUrl('http://www.example.com/'), True, False), (QUrl('://'), False, True), ]) def test_invalid_url_error(self, url, raising, has_err_string): """Test InvalidUrlError. Args: url: The URL to pass to InvalidUrlError. raising; True if the InvalidUrlError should raise itself. has_err_string: Whether the QUrl is expected to have errorString set. """ if raising: expected_exc = ValueError else: expected_exc = urlutils.InvalidUrlError with pytest.raises(expected_exc) as excinfo: raise urlutils.InvalidUrlError(url) if not raising: expected_text = "Invalid URL" if has_err_string: expected_text += " - " + url.errorString() assert str(excinfo.value) == expected_text def test_value_error_subclass(self): """Make sure InvalidUrlError is a ValueError subclass.""" with pytest.raises(ValueError): raise urlutils.InvalidUrlError(QUrl()) @pytest.mark.parametrize('are_same, url1, url2', [ (True, 'http://example.com', 'http://www.example.com'), (True, 'http://bbc.co.uk', 'https://www.bbc.co.uk'), (True, 'http://many.levels.of.domains.example.com', 'http://www.example.com'), (True, 'http://idn.иком.museum', 'http://idn2.иком.museum'), (True, 'http://one.not_a_valid_tld', 'http://one.not_a_valid_tld'), (False, 'http://bbc.co.uk', 'http://example.co.uk'), (False, 'https://example.kids.museum', 'http://example.kunst.museum'), (False, 'http://idn.иком.museum', 'http://idn.ירושלים.museum'), (False, 'http://one.not_a_valid_tld', 'http://two.not_a_valid_tld'), ]) def test_same_domain(are_same, url1, url2): """Test same_domain.""" assert urlutils.same_domain(QUrl(url1), QUrl(url2)) == are_same assert urlutils.same_domain(QUrl(url2), QUrl(url1)) == are_same @pytest.mark.parametrize('url1, url2', [ ('http://example.com', ''), ('', 'http://example.com'), ]) def test_same_domain_invalid_url(url1, url2): """Test same_domain with invalid URLs.""" with pytest.raises(urlutils.InvalidUrlError): urlutils.same_domain(QUrl(url1), QUrl(url2)) @pytest.mark.parametrize('url, expected', [ ('http://example.com', 'http://example.com'), ('http://ünicode.com', 'http://xn--nicode-2ya.com'), ('http://foo.bar/?header=text/pläin', 'http://foo.bar/?header=text/pl%C3%A4in'), ]) def test_encoded_url(url, expected): url = QUrl(url) assert urlutils.encoded_url(url) == expected class TestIncDecNumber: """Tests for urlutils.incdec_number().""" @pytest.mark.parametrize('incdec', ['increment', 'decrement']) @pytest.mark.parametrize('value', [ '{}foo', 'foo{}', 'foo{}bar', '42foo{}' ]) @pytest.mark.parametrize('url', [ 'http://example.com:80/v1/path/{}/test', 'http://example.com:80/v1/query_test?value={}', 'http://example.com:80/v1/anchor_test#{}', 'http://host_{}_test.com:80', 'http://m4ny.c0m:80/number5/3very?where=yes#{}' ]) def test_incdec_number(self, incdec, value, url): """Test incdec_number with valid URLs.""" # The integer used should not affect test output, as long as it's # bigger than 1 # 20 was chosen by dice roll, guaranteed to be random base_value = value.format(20) if incdec == 'increment': expected_value = value.format(21) else: expected_value = value.format(19) base_url = QUrl(url.format(base_value)) expected_url = QUrl(url.format(expected_value)) new_url = urlutils.incdec_number( base_url, incdec, segments={'host', 'path', 'query', 'anchor'}) assert new_url == expected_url @pytest.mark.parametrize('number, expected, incdec', [ ('01', '02', 'increment'), ('09', '10', 'increment'), ('009', '010', 'increment'), ('02', '01', 'decrement'), ('10', '9', 'decrement'), ('010', '009', 'decrement') ]) def test_incdec_leading_zeroes(self, number, expected, incdec): """Test incdec_number with leading zeroes.""" url = 'http://example.com/{}' base_url = QUrl(url.format(number)) expected_url = QUrl(url.format(expected)) new_url = urlutils.incdec_number(base_url, incdec, segments={'path'}) assert new_url == expected_url @pytest.mark.parametrize('url, segments, expected', [ ('http://ex4mple.com/test_4?page=3#anchor2', {'host'}, 'http://ex5mple.com/test_4?page=3#anchor2'), ('http://ex4mple.com/test_4?page=3#anchor2', {'host', 'path'}, 'http://ex4mple.com/test_5?page=3#anchor2'), ('http://ex4mple.com/test_4?page=3#anchor5', {'host', 'path', 'query'}, 'http://ex4mple.com/test_4?page=4#anchor5'), ]) def test_incdec_segment_ignored(self, url, segments, expected): new_url = urlutils.incdec_number(QUrl(url), 'increment', segments=segments) assert new_url == QUrl(expected) @pytest.mark.parametrize('url', [ "http://example.com/long/path/but/no/number", "http://ex4mple.com/number/in/hostname", "http://example.com:42/number/in/port", "http://www2.example.com/number/in/subdomain", "http://example.com/%C3%B6/urlencoded/data", "http://example.com/number/in/anchor#5", "http://www2.ex4mple.com:42/all/of/the/%C3%A4bove#5", ]) def test_no_number(self, url): """Test incdec_number with URLs that don't contain a number.""" with pytest.raises(urlutils.IncDecError): urlutils.incdec_number(QUrl(url), "increment") def test_number_below_0(self): """Test incdec_number with a number <0 after decrementing.""" with pytest.raises(urlutils.IncDecError): urlutils.incdec_number(QUrl('http://example.com/page_0.html'), 'decrement') def test_invalid_url(self): """Test if incdec_number rejects an invalid URL.""" with pytest.raises(urlutils.InvalidUrlError): urlutils.incdec_number(QUrl(""), "increment") def test_wrong_mode(self): """Test if incdec_number rejects a wrong parameter for incdec.""" valid_url = QUrl("http://example.com/0") with pytest.raises(ValueError): urlutils.incdec_number(valid_url, "foobar") def test_wrong_segment(self): """Test if incdec_number rejects a wrong segment.""" with pytest.raises(urlutils.IncDecError): urlutils.incdec_number(QUrl('http://example.com'), 'increment', segments={'foobar'}) @pytest.mark.parametrize("url, msg, expected_str", [ ("http://example.com", "Invalid", "Invalid: http://example.com"), ]) def test_incdec_error(self, url, msg, expected_str): """Test IncDecError.""" url = QUrl(url) with pytest.raises(urlutils.IncDecError) as excinfo: raise urlutils.IncDecError(msg, url) assert excinfo.value.url == url assert str(excinfo.value) == expected_str