Mercurial > piecrust2
view piecrust/importing/base.py @ 1188:a7c43131d871
bake: Fix file write flushing problem with Python 3.8+
Writing the cache files fails in Python 3.8 because it looks like flushing
behaviour has changed. We need to explicitly flush. And even then, in very
rare occurrences, it looks like it can still run into race conditions,
so we do a very hacky and ugly "retry" loop when fetching cached data :(
author | Ludovic Chabant <ludovic@chabant.com> |
---|---|
date | Tue, 15 Jun 2021 22:36:23 -0700 |
parents | 9093618aea08 |
children |
line wrap: on
line source
import os.path
import shutil
import codecs
import logging
from urllib.parse import urlparse
from urllib.request import urlopen

import yaml

from piecrust.pathutil import SiteNotFoundError, multi_fnmatch_filter


logger = logging.getLogger(__name__)


class Importer(object):
    """Base class for website importers.

    Subclasses set `name` and `description`, and override `setupParser`
    and `importWebsite`. `requires_website` controls whether
    `checkedImportWebsite` refuses to run when the application has no
    root directory.
    """

    name = None
    description = None
    requires_website = True

    def setupParser(self, parser, app):
        """Register this importer's command-line arguments on `parser`.

        Must be overridden; the base implementation raises
        `NotImplementedError`.
        """
        raise NotImplementedError()

    def importWebsite(self, app, args):
        """Run the import for `app` using the parsed `args`.

        Must be overridden; the base implementation raises
        `NotImplementedError`.
        """
        raise NotImplementedError()

    def checkedImportWebsite(self, ctx):
        """Validate the context, then delegate to `importWebsite`.

        Raises `SiteNotFoundError` when this importer requires a website
        and `ctx.app.root_dir` is `None`. Otherwise returns whatever
        `importWebsite(ctx.app, ctx.args)` returns.
        """
        if ctx.app.root_dir is None and self.requires_website:
            raise SiteNotFoundError()
        return self.importWebsite(ctx.app, ctx.args)


class FileWalkingImporter(Importer):
    """Importer that walks a directory tree and imports each file.

    `_startWalk` calls `self._importFile(full_path, rel_path, ...)` for
    every file that is not excluded; this class does not define
    `_importFile`, so subclasses are expected to provide it.
    """

    def setupParser(self, parser, app):
        """Add the `--exclude` option to `parser`."""
        parser.add_argument(
            '--exclude', nargs='+',
            help=("Patterns of files and directories to exclude "
                  "from the import (always includes `.git*`, "
                  "`.hg*`, `.svn`, `.bzr`)."))

    def _startWalk(self, root_dir, exclude, *args, **kwargs):
        """Walk `root_dir` and call `_importFile` on each retained file.

        `exclude` is an iterable of patterns, or `None`. Version-control
        patterns are always appended to it. Extra positional and keyword
        arguments are forwarded unchanged to `_importFile`.
        """
        # Build a fresh list instead of `exclude += ...`: the argument is
        # typically the caller's own list (e.g. parsed CLI arguments), and
        # mutating it would leak the defaults back to the caller and
        # duplicate them on repeated walks.
        patterns = list(exclude or []) + ['.git*', '.hg*', '.svn', '.bzr']

        for dirpath, dirnames, filenames in os.walk(root_dir):
            rel_dirpath = os.path.relpath(dirpath, root_dir)
            if rel_dirpath == '.':
                rel_dirpath = ''

            # Patterns are tested against paths relative to `root_dir`.
            # NOTE(review): `inverse=True` presumably keeps the names that
            # do NOT match -- confirm against piecrust.pathutil.
            # Assigning through `dirnames[:]` edits the list in place so
            # that os.walk does not descend into the removed directories.
            dirnames[:] = multi_fnmatch_filter(
                dirnames, patterns,
                modifier=lambda d: os.path.join(rel_dirpath, d),
                inverse=True)
            filenames = multi_fnmatch_filter(
                filenames, patterns,
                modifier=lambda f: os.path.join(rel_dirpath, f),
                inverse=True)

            for fn in filenames:
                full_fn = os.path.join(dirpath, fn)
                rel_fn = os.path.join(rel_dirpath, fn)
                logger.debug("Importing file: %s", rel_fn)
                self._importFile(full_fn, rel_fn, *args, **kwargs)


def create_page(app, rel_path, metadata, content):
    """Write a page file made of a YAML header followed by `content`.

    The file is created at `rel_path` under `app.root_dir`, and missing
    parent directories are created. `metadata` is dumped with `yaml.dump`
    and enclosed between two `---` lines. The file is written as UTF-8.
    """
    path = os.path.join(app.root_dir, rel_path)
    # Use the module logger, like the rest of this file, rather than the
    # root logger.
    logger.info("Creating page: %s", rel_path)
    header = yaml.dump(metadata)
    os.makedirs(os.path.dirname(path), mode=0o755, exist_ok=True)
    with codecs.open(path, 'w', encoding='utf8') as fp:
        fp.write("---\n")
        fp.write(header)
        fp.write("---\n")
        fp.write(content)


def download_asset(app, url, rel_path=None, skip_if_exists=True):
    """Download `url` into a file under `app.root_dir`.

    When `rel_path` is `None`, the destination is `assets/` followed by
    the URL's path component with leading slashes removed. When
    `skip_if_exists` is true and the destination already exists, nothing
    is downloaded. Missing parent directories are created.
    """
    if rel_path is None:
        parsed_url = urlparse(url)
        rel_path = 'assets/' + parsed_url.path.lstrip('/')

    path = os.path.join(app.root_dir, rel_path)
    if skip_if_exists and os.path.exists(path):
        return

    logger.info("Downloading %s", rel_path)
    os.makedirs(os.path.dirname(path), mode=0o755, exist_ok=True)
    with urlopen(url) as resp, open(path, 'wb') as fp:
        shutil.copyfileobj(resp, fp)