qutebrowser/scripts/importer.py

69 lines
2.0 KiB
Python
Raw Normal View History

#!/usr/bin/env python3
2014-10-15 20:43:47 +02:00
# vim: ft=python fileencoding=utf-8 sts=4 sw=4 et:
# Copyright 2014 Claude (longneck) <longneck@scratchbook.ch>
# This file is part of qutebrowser.
#
# qutebrowser is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# qutebrowser is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with qutebrowser. If not, see <http://www.gnu.org/licenses/>.
2014-10-15 06:20:54 +02:00
"""Tool to import data from other browsers.
Currently only importing bookmarks from Chromium is supported.
"""
2014-10-15 06:16:12 +02:00
import argparse
def main():
    """Parse the command line and run the importer for the chosen browser."""
    options = get_args()
    if options.browser != 'chromium':
        # Chromium is the only browser with an importer; nothing else to do.
        return
    import_chromium(options.bookmarks)
2014-10-15 06:16:12 +02:00
def get_args(argv=None):
    """Parse the command line arguments and return the result.

    Args:
        argv: Optional list of argument strings to parse. When None (the
              default), argparse reads the arguments from sys.argv.

    Return:
        The argparse namespace with the attributes `browser` and `bookmarks`.
    """
    parser = argparse.ArgumentParser(
        epilog="To import bookmarks from Chromium, export them to HTML in "
               "Chromium's bookmark manager.")
    parser.add_argument('browser', help="Which browser?", choices=['chromium'],
                        metavar='browser')
    parser.add_argument('bookmarks', help="Bookmarks file")
    return parser.parse_args(argv)
2014-10-15 06:16:12 +02:00
def import_chromium(bookmarks_file):
    """Import bookmarks from a HTML file generated by Chromium.

    Every anchor carrying a href attribute is printed to stdout as
    "<title> <url>", one bookmark per line, in document order. Each URL is
    printed only once; later anchors with an already seen URL are skipped.

    Args:
        bookmarks_file: Path to the HTML bookmarks file, read as UTF-8.
    """
    # Third-party dependency which is only used by this importer.
    import bs4

    with open(bookmarks_file, encoding='utf-8') as f:
        # Name the parser explicitly so the parse result does not depend on
        # which optional parser libraries happen to be installed.
        soup = bs4.BeautifulSoup(f, 'html.parser')

    seen_urls = set()
    bookmarks = []
    # href=True skips anchors without a href instead of raising KeyError.
    for tag in soup.find_all('a', href=True):
        url = tag['href']
        # Deduplicate on the URL itself: the formatted "<title> <url>" lines
        # never equal a bare URL, so checking those would filter nothing.
        if url in seen_urls:
            continue
        seen_urls.add(url)
        bookmarks.append('{tag.string} {tag[href]}'.format(tag=tag))

    for bookmark in bookmarks:
        print(bookmark)
2014-10-15 06:16:12 +02:00
# Run the importer only when executed as a script, not when imported.
if __name__ == '__main__':
    main()