2015-02-01 17:34:16 +01:00
|
|
|
# vim: ft=python fileencoding=utf-8 sts=4 sw=4 et:
|
|
|
|
|
2016-01-04 07:12:39 +01:00
|
|
|
# Copyright 2015-2016 Florian Bruhin (The Compiler) <mail@qutebrowser.org>
|
2015-02-01 17:34:16 +01:00
|
|
|
#
|
|
|
|
# This file is part of qutebrowser.
|
|
|
|
#
|
|
|
|
# qutebrowser is free software: you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# qutebrowser is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with qutebrowser. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
"""Simple history which gets written to disk."""
|
|
|
|
|
|
|
|
import time
|
2015-03-13 19:44:15 +01:00
|
|
|
import collections
|
2015-02-01 17:34:16 +01:00
|
|
|
|
2016-06-09 11:45:25 +02:00
|
|
|
from PyQt5.QtCore import pyqtSignal, QUrl, QObject
|
2015-02-01 17:34:16 +01:00
|
|
|
from PyQt5.QtWebKit import QWebHistoryInterface
|
|
|
|
|
2016-01-23 23:36:24 +01:00
|
|
|
from qutebrowser.commands import cmdutils
|
2015-04-10 06:40:48 +02:00
|
|
|
from qutebrowser.utils import utils, objreg, standarddir, log
|
2015-02-01 17:34:16 +01:00
|
|
|
from qutebrowser.config import config
|
2015-03-02 20:07:26 +01:00
|
|
|
from qutebrowser.misc import lineparser
|
2015-02-01 17:34:16 +01:00
|
|
|
|
|
|
|
|
|
|
|
class HistoryEntry:

    """One visited page as recorded in the web history.

    Attributes:
        atime: The time the page was accessed, stored as a float.
        url: The URL which was accessed as QUrl.
        url_string: The URL which was accessed as string.
        title: The title given for the page.
        hidden: If True, don't save this entry to disk
    """

    def __init__(self, atime, url, title, hidden=False):
        # atime may arrive as a string (when parsed from the history file)
        # or as a number (time.time()), so it is normalized to float.
        self.atime = float(atime)
        self.url = QUrl(url)
        self.url_string = url
        self.title = title
        self.hidden = hidden

    def __repr__(self):
        display_url = self.url.toDisplayString()
        return utils.get_repr(self, constructor=True, atime=self.atime,
                              url=display_url, title=self.title,
                              hidden=self.hidden)

    def __str__(self):
        # "<integer atime> <url> <title>", the format get_recent() and
        # save() hand over to the line parser.
        fields = (int(self.atime), self.url_string, self.title)
        return '{} {} {}'.format(*fields)
|
2015-02-01 17:34:16 +01:00
|
|
|
|
2016-06-08 15:38:52 +02:00
|
|
|
|
2016-06-09 11:45:25 +02:00
|
|
|
class WebHistoryInterface(QWebHistoryInterface):

    """Adapter exposing a WebHistory through Qt's QWebHistoryInterface.

    Attributes:
        _history: The WebHistory object.
    """

    def __init__(self, webhistory, parent):
        super().__init__(parent)
        self._history = webhistory

    def addHistoryEntry(self, url_string):
        """Required for a QWebHistoryInterface impl, obsoleted by add_url."""

    def historyContains(self, url_string):
        """Tell WebKit whether a URL is part of the history.

        Args:
            url_string: The URL (as string) to check for.

        Return:
            True if the url is in the history, False otherwise.
        """
        known_urls = self._history.history_dict
        return url_string in known_urls
|
|
|
|
|
|
|
|
|
|
|
|
class WebHistory(QObject):

    """The global history of visited pages.

    Attributes:
        history_dict: An OrderedDict mapping URL strings to HistoryEntry
                      items. It is filled from the on-disk history by
                      async_read and by add_url once the read is done.
        _lineparser: The AppendLineParser used to save the history.
        _new_history: A list of HistoryEntry items of the current session.
        _saved_count: How many HistoryEntries have been written to disk.
        _initial_read_started: Whether async_read was called.
        _initial_read_done: Whether async_read has completed.
        _temp_history: OrderedDict of temporary history entries added
                       before async_read has completed.

    Signals:
        add_completion_item: Emitted before a new HistoryEntry is added.
                             arg: The new HistoryEntry.
        item_added: Emitted after a new HistoryEntry is added.
                    arg: The new HistoryEntry.
        cleared: Emitted after the history is cleared.
        async_read_done: Emitted when async_read has finished reading (or
                         found that there is no data directory to read).
    """

    add_completion_item = pyqtSignal(HistoryEntry)
    item_added = pyqtSignal(HistoryEntry)
    cleared = pyqtSignal()
    async_read_done = pyqtSignal()

    def __init__(self, parent=None):
        super().__init__(parent)
        self._initial_read_started = False
        self._initial_read_done = False
        self._lineparser = lineparser.AppendLineParser(
            standarddir.data(), 'history', parent=self)
        self.history_dict = collections.OrderedDict()
        self._temp_history = collections.OrderedDict()
        self._new_history = []
        self._saved_count = 0
        objreg.get('save-manager').add_saveable(
            'history', self.save, self.item_added)

    def __repr__(self):
        return utils.get_repr(self, length=len(self))

    def __getitem__(self, key):
        # Indexing addresses the entries of the current session only,
        # unlike __iter__/__len__ which cover history_dict.
        return self._new_history[key]

    def __iter__(self):
        return iter(self.history_dict.values())

    def __len__(self):
        return len(self.history_dict)

    def async_read(self):
        """Read the initial history.

        This is a generator: it yields before every line it processes, so
        the caller decides how quickly the file is consumed. Lines which
        can't be parsed (wrong number of fields or a non-numeric access
        time) are logged and skipped.

        Once reading is done, entries which were added via add_url in the
        meantime are merged from _temp_history into the real history.
        """
        if self._initial_read_started:
            log.init.debug("Ignoring async_read() because reading is started.")
            return
        self._initial_read_started = True

        if standarddir.data() is None:
            # No data directory, so there is nothing to read.
            self._initial_read_done = True
            self.async_read_done.emit()
            return

        with self._lineparser.open():
            for line in self._lineparser:
                yield
                data = line.rstrip().split(maxsplit=2)
                if not data:
                    # empty line
                    continue
                elif len(data) == 2:
                    atime, url = data
                    title = ""
                elif len(data) == 3:
                    atime, url, title = data
                else:
                    # other malformed line
                    log.init.warning("Invalid history entry {!r}!".format(
                        line))
                    continue
                if atime.startswith('\0'):
                    log.init.debug(
                        "Removing NUL bytes from entry {!r} - see "
                        "https://github.com/The-Compiler/qutebrowser/issues/"
                        "670".format(data))
                    atime = atime.lstrip('\0')
                try:
                    entry = HistoryEntry(atime, url, title)
                except ValueError:
                    # HistoryEntry converts atime with float(); without
                    # this, one corrupt timestamp would abort the whole
                    # read and _initial_read_done would never be set.
                    log.init.warning("Invalid history entry {!r}!".format(
                        line))
                    continue
                # This de-duplicates history entries; only the latest
                # entry for each URL is kept. If you want to keep
                # information about previous hits change the items in
                # history_dict to be lists or change HistoryEntry to have
                # a list of atimes.
                self._add_entry(entry)

        self._initial_read_done = True
        self.async_read_done.emit()

        # Merge what add_url collected while the read was in progress.
        for entry in self._temp_history.values():
            self._add_entry(entry)
            if not entry.hidden:
                self._new_history.append(entry)
                self.add_completion_item.emit(entry)

    def _add_entry(self, entry, target=None):
        """Add an entry to self.history_dict or another given OrderedDict."""
        if target is None:
            target = self.history_dict
        target[entry.url_string] = entry
        # Re-assigning an existing key keeps its old position, so move it
        # explicitly to make the newest visit the last item.
        target.move_to_end(entry.url_string)

    def get_recent(self):
        """Get the most recent history entries."""
        old = self._lineparser.get_recent()
        return old + [str(e) for e in self._new_history]

    def save(self):
        """Save the history to disk."""
        # Only hand over the entries which were not written yet.
        new = (str(e) for e in self._new_history[self._saved_count:])
        self._lineparser.new_data = new
        self._lineparser.save()
        self._saved_count = len(self._new_history)

    @cmdutils.register(name='history-clear', instance='web-history')
    def clear(self):
        """Clear all browsing history.

        Note this only clears the global history
        (e.g. `~/.local/share/qutebrowser/history` on Linux) but not cookies,
        the back/forward history of a tab, cache or other persistent data.
        """
        self._lineparser.clear()
        self.history_dict.clear()
        self._temp_history.clear()
        self._new_history.clear()
        self._saved_count = 0
        self.cleared.emit()

    def add_url(self, url_string, title="", hidden=False):
        """Called by WebKit when an URL should be added to the history.

        Nothing is recorded for an empty url_string or while the
        general -> private-browsing setting is enabled.

        Args:
            url_string: An url as string to add to the history.
            title: The title to store for the entry.
            hidden: Whether to hide the entry from the on-disk history
        """
        if not url_string:
            return
        if config.get('general', 'private-browsing'):
            return
        entry = HistoryEntry(time.time(), url_string, title, hidden=hidden)
        if self._initial_read_done:
            self._add_entry(entry)
            if not entry.hidden:
                self.add_completion_item.emit(entry)
                self._new_history.append(entry)
                self.item_added.emit(entry)
        else:
            # The on-disk history isn't read completely yet; async_read
            # merges these entries when it's done.
            self._add_entry(entry, target=self._temp_history)
|
2015-02-01 17:34:16 +01:00
|
|
|
|
|
|
|
|
|
|
|
|
2015-04-06 00:10:37 +02:00
|
|
|
def init(parent=None):
    """Set up the global web history and hook it into QtWebKit.

    The WebHistory is registered in objreg as 'web-history', and a
    WebHistoryInterface wrapping it is installed as the default
    QWebHistoryInterface.

    Args:
        parent: The parent to use for WebHistory.
    """
    web_history = WebHistory(parent)
    objreg.register('web-history', web_history)

    qt_interface = WebHistoryInterface(web_history, parent=web_history)
    QWebHistoryInterface.setDefaultInterface(qt_interface)
|