piecrust2: piecrust/serving/procloop.py @ 876:d1095774bfcf
refactor: Fix some issues with record/cache entry collisions, add counters.
author:   Ludovic Chabant <ludovic@chabant.com>
date:     Thu, 15 Jun 2017 07:33:40 -0700
parents:  c71472e6537f
children: 342e3ea24b5d
import os
import os.path
import time
import json
import queue
import logging
import itertools
import threading
from piecrust import CONFIG_PATH, THEME_CONFIG_PATH
from piecrust.pipelines.base import (
    PipelineJobCreateContext, PipelineJobRunContext, PipelineJobResult,
    PipelineManager)
from piecrust.pipelines.records import (
    MultiRecord, MultiRecordHistory)


logger = logging.getLogger(__name__)

# This flag is for cancelling all long running requests like SSEs.
server_shutdown = False


class PipelineStatusServerSentEventProducer(object):
    """ The producer for Server-Sent Events (SSE) notifying the front-end
        about useful things like assets having been re-processed in the
        background.
        Each has its own queue because the user could have multiple pages
        open, each having to display notifications coming from the server.
    """
    def __init__(self, proc_loop):
        self._proc_loop = proc_loop
        self._queue = queue.Queue()
        self._start_time = 0
        self._poll_interval = 0.5
        self._ping_interval = 30
        self._time_between_pings = 0
        self._running = 0

    def addBuildEvent(self, item):
        self._queue.put_nowait(item)

    def run(self):
        logger.debug("Starting pipeline status SSE.")
        self._proc_loop.addObserver(self)
        self._start_time = time.time()
        self._running = 1

        outstr = 'event: ping\ndata: started\n\n'
        yield bytes(outstr, 'utf8')

        while self._running == 1 and not server_shutdown:
            try:
                # We use a short poll interval (less than a second) because
                # we need to catch `server_shutdown` going `True` as soon as
                # possible to exit this thread when the user hits `CTRL+C`.
                data = self._queue.get(True, self._poll_interval)
            except queue.Empty:
                # Not exact timing but close enough.
                self._time_between_pings += self._poll_interval
                if self._time_between_pings >= self._ping_interval:
                    self._time_between_pings = 0
                    logger.debug("Sending ping/heartbeat event.")
                    outstr = 'event: ping\ndata: 1\n\n'
                    yield bytes(outstr, 'utf8')
                continue

            logger.debug("Sending pipeline status SSE.")
            outstr = (('event: %s\n' % data['type']) +
                      ('id: %s\n' % data['id']) +
                      ('data: %s\n\n' % json.dumps(data)))
            self._queue.task_done()
            yield bytes(outstr, 'utf8')

    def close(self):
        logger.debug("Closing pipeline status SSE.")
        self._proc_loop.removeObserver(self)
        self._running = 2


class _AssetProcessingInfo:
    def __init__(self, source):
        self.source = source
        self.paths = set()
        self.last_bake_time = time.time()


class ProcessingLoop(threading.Thread):
    def __init__(self, appfactory, out_dir):
        super().__init__(name='pipeline-reloader', daemon=True)
        self.appfactory = appfactory
        self.out_dir = out_dir
        self.last_status_id = 0
        self.interval = 1
        self._app = None
        self._proc_infos = None
        self._last_records = None
        self._last_config_mtime = 0
        self._obs = []
        self._obs_lock = threading.Lock()
        config_name = (
            THEME_CONFIG_PATH if appfactory.theme_site else CONFIG_PATH)
        self._config_path = os.path.join(appfactory.root_dir, config_name)

    def addObserver(self, obs):
        with self._obs_lock:
            self._obs.append(obs)

    def removeObserver(self, obs):
        with self._obs_lock:
            self._obs.remove(obs)

    def run(self):
        logger.debug("Initializing processing loop with output: %s" %
                     self.out_dir)
        try:
            self._init()
        except Exception as ex:
            logger.error("Error initializing processing loop:")
            logger.exception(ex)
            return

        logger.debug("Doing initial processing loop bake...")
        self._runPipelines()

        logger.debug("Running processing loop...")
        self._last_config_mtime = os.path.getmtime(self._config_path)
        while True:
            cur_config_time = os.path.getmtime(self._config_path)
            if self._last_config_mtime < cur_config_time:
                logger.info("Site configuration changed, reloading pipeline.")
                self._last_config_mtime = cur_config_time
                self._init()
                self._runPipelines()
                continue

            for procinfo in self._proc_infos.values():
                # For each assets folder we try to find the first new or
                # modified file. If any, we just run the pipeline on
                # that source.
                found_new_or_modified = False
                for item in procinfo.source.getAllContents():
                    path = item.spec
                    if path not in procinfo.paths:
                        logger.debug("Found new asset: %s" % path)
                        procinfo.paths.add(path)
                        found_new_or_modified = True
                        break
                    if os.path.getmtime(path) > procinfo.last_bake_time:
                        logger.debug("Found modified asset: %s" % path)
                        found_new_or_modified = True
                        break
                if found_new_or_modified:
                    self._runPipelines(procinfo.source)

            time.sleep(self.interval)

    def _init(self):
        self._app = self.appfactory.create()
        self._last_records = MultiRecord()

        self._proc_infos = {}
        for src in self._app.sources:
            if src.config['pipeline'] != 'asset':
                continue

            procinfo = _AssetProcessingInfo(src)
            self._proc_infos[src.name] = procinfo

            # Build the list of initial asset files.
            for item in src.getAllContents():
                procinfo.paths.add(item.spec)

    def _runPipelines(self, only_for_source=None):
        current_records = MultiRecord()
        record_histories = MultiRecordHistory(
            self._last_records, current_records)
        ppmngr = PipelineManager(
            self._app, self.out_dir, record_histories)

        # Create the pipelines, but also remember some stuff for what
        # we want to do.
        for src in self._app.sources:
            if src.config['pipeline'] != 'asset':
                continue
            if only_for_source is not None and src != only_for_source:
                continue

            ppmngr.createPipeline(src)

        for ppinfo in ppmngr.getPipelines():
            self._runPipeline(ppmngr, ppinfo)

        self.last_status_id += 1

        if self._last_records.success:
            for rec in self._last_records.records:
                changed = filter(
                    lambda i: not i.was_collapsed_from_last_run,
                    rec.getEntries())
                changed = itertools.chain.from_iterable(
                    map(lambda i: i.out_paths, changed))
                changed = list(changed)
                item = {
                    'id': self.last_status_id,
                    'type': 'pipeline_success',
                    'assets': changed}

                self._notifyObservers(item)
        else:
            item = {
                'id': self.last_status_id,
                'type': 'pipeline_error',
                'assets': []}
            for rec in self._last_records.records:
                for entry in rec.getEntries():
                    if entry.errors:
                        asset_item = {
                            'path': entry.item_spec,
                            'errors': list(entry.errors)}
                        item['assets'].append(asset_item)

            self._notifyObservers(item)

    def _runPipeline(self, ppmngr, ppinfo):
        src = ppinfo.source
        logger.debug("Running pipeline '%s' on: %s" %
                     (ppinfo.pipeline_name, src.name))

        # Set the time.
        procinfo = self._proc_infos[src.name]
        procinfo.last_bake_time = time.time()

        # Process all items in the source.
        pp = ppinfo.pipeline
        cr = ppinfo.record_history.current
        record_histories = ppmngr.record_histories
        current_records = record_histories.current
        jobctx = PipelineJobCreateContext(0, record_histories)
        jobs = pp.createJobs(jobctx)
        for job in jobs:
            runctx = PipelineJobRunContext(
                job, pp.record_name, record_histories)

            ppres = PipelineJobResult()
            ppres.record_entry = pp.createRecordEntry(job, runctx)

            try:
                pp.run(job, runctx, ppres)
            except Exception as e:
                ppres.record_entry.errors.append(str(e))

            if ppres.next_pass_job is not None:
                logger.error("The processing loop for the server "
                             "doesn't support multi-pass pipelines.")

            cr.addEntry(ppres.record_entry)
            if not ppres.record_entry.success:
                cr.success = False
                current_records.success = False
                logger.error("Errors found in %s:" % job.content_item.spec)
                for e in ppres.record_entry.errors:
                    logger.error(" " + e)

        # Do all the final stuff.
        ppmngr.postJobRun()
        ppmngr.deleteStaleOutputs()
        ppmngr.collapseRecords()
        ppmngr.shutdownPipelines()

        # Swap the old record with the next record.
        pr = ppinfo.record_history.previous
        logger.debug("Swapping record '%s' with '%s'." % (pr.name, cr.name))
        self._last_records.records.remove(pr)
        self._last_records.records.append(cr)

    def _notifyObservers(self, item):
        with self._obs_lock:
            observers = list(self._obs)
        for obs in observers:
            obs.addBuildEvent(item)
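
Usage note (not part of the file above): a minimal sketch of how these two classes could be wired together by a development server, assuming only what the module itself exposes. The loop runs as a daemon thread while each connected browser page gets its own SSE producer whose generator yields ready-to-send byte chunks. The helper names `start_processing_loop` and `sse_response_body`, and the idea of handing the generator to a streaming HTTP response, are illustrative assumptions, not piecrust's actual server code.

from piecrust.serving.procloop import (
    ProcessingLoop, PipelineStatusServerSentEventProducer)


def start_processing_loop(appfactory, out_dir):
    # Hypothetical helper: `appfactory` is assumed to expose `root_dir`,
    # `theme_site` and `create()`, as ProcessingLoop requires above.
    proc_loop = ProcessingLoop(appfactory, out_dir)
    proc_loop.start()  # daemon thread; re-processes assets in the background
    return proc_loop


def sse_response_body(proc_loop):
    # Hypothetical helper: one producer (and queue) per connected page.
    # `run()` is a generator of SSE-formatted bytes; `close()` detaches
    # the producer from the loop's observer list when the client goes away.
    producer = PipelineStatusServerSentEventProducer(proc_loop)
    try:
        yield from producer.run()
    finally:
        producer.close()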