development/doxygen/validationserver_8py_source.html

from typing import Dict, Any, List, Tuple

from glob import glob

import json

import functools

import time

import datetime

from multiprocessing import Process, Queue

import os.path

import argparse

import logging

import sys

import queue

import webbrowser

import re

import collections

import configparser

import requests


# 3rd

import cherrypy

import gitlab


# ours

import json_objects

from validationplots import create_plots

import validationfunctions

import validationpath


# Registry of plotting jobs, keyed by the revision key of the request. Each
# entry holds the worker process, the queue carrying its progress messages and
# the last status message read from that queue (None until one was read).
g_plottingProcesses: Dict[str, Tuple[Process, Queue, Dict[str, Any]]] = ({})


def get_revision_label_from_json_filename(json_filename: str) -> str:
    """
    Derive the revision label from the location of a revision json file.

    The label is the name of the folder that directly contains the file, so
    ``results/r121/revision.json`` yields ``r121``. Using the folder name keeps
    the label correct even if the user moved the results folder.
    """
    containing_folder, _ = os.path.split(json_filename)
    return os.path.basename(containing_folder)


def get_json_object_list(
    results_folder: str, json_file_name: str
) -> List[str]:
    """
    Collect the labels of all sub-folders of ``results_folder`` that contain
    a json file called ``json_file_name``.

    Every matching file is parsed once, so a file with invalid json raises
    instead of being listed. The label is always the name of the sub-folder.
    """
    labels = []
    for json_path in glob(results_folder + "/*/" + json_file_name):
        with open(json_path) as handle:
            # parsed only to make sure the file holds valid json
            json.load(handle)
        labels.append(get_revision_label_from_json_filename(json_path))

    return labels


def deliver_json(file_name: str):
    """
    Read the json file ``file_name`` and return the parsed python objects.
    """
    with open(file_name) as source:
        return json.load(source)


def create_revision_key(revision_names: List[str]) -> str:
    """
    Build the string key for a list of revisions; it is handed to the
    browser as progress key.

    Every revision name is prefixed with a dash, so ``["a", "b"]`` becomes
    ``"-a-b"`` and an empty list becomes the empty string.
    """
    return "".join("-" + name for name in revision_names)


def check_plotting_status(progress_key: str):
    """
    Return the latest status message of the plotting job registered under
    ``progress_key``, or None if no such job is known.
    """
    entry = g_plottingProcesses.get(progress_key)
    if entry is None:
        return None

    process, qu, last_status = entry

    try:
        # drain the queue; the newest message wins
        while not qu.empty():
            last_status = qu.get_nowait()
            # remember it, so it is still available once the queue is empty
            g_plottingProcesses[progress_key] = (process, qu, last_status)
    except queue.Empty:
        # the queue ran dry between the empty() check and the read
        pass

    return last_status


# todo: remove this, once we're certain that the bug was fixed!

def warn_wrong_directory():
    """
    Print an error message if the current working directory does not end
    with "html".
    """
    cwd = os.getcwd()
    if cwd.endswith("html"):
        return

    print(
        "ERROR: Expected to be in HTML directory, but my current "
        f"working directory is {cwd}; abspath: {cwd}."
    )


# todo: limit the number of running plotting requests & terminate hanging ones

def start_plotting_request(
    revision_names: List[str], results_folder: str
) -> str:
    """
    Launch the comparison of the supplied revisions in a separate process,
    unless a job for the same combination is already registered.

    Returns:
        revision key
    """
    key = create_revision_key(revision_names)

    # a job for this combination was already registered: hand out its key
    if key in g_plottingProcesses:
        logging.info(f"Plotting request for {key} still running")
        return key

    # queue handed to the plotting process; check_plotting_status reads the
    # progress messages from it
    progress_queue = Queue()

    # create_plots expects the work dir, which contains the results folder,
    # hence one folder up
    work_folder = os.path.dirname(results_folder)

    worker = Process(
        target=create_plots,
        args=(revision_names, False, progress_queue, work_folder),
    )
    worker.start()
    g_plottingProcesses[key] = (worker, progress_queue, None)

    logging.info(f"Started process for plotting request {key}")

    return key


"""

Gitlab Integration


The functions below enable the validationserver to

interact directly with the Gitlab project page to track and

update issues.


Requirement:

Config file with project information and access token in the local

machine. This is expected to be in the validation/config folder, in

the same root directory as the html_static files.


A check is performed to see if the config file exists with all the

relevant details and all of Gitlab functionalities are enabled/disabled

accordingly.


When the server is being set up, a Gitlab object is created, which

will be used subsequently to make all the API calls.


As a final server initialization step, the project is queried to

check if any of the current results are linked to existing issues

and the result files are updated accordingly.


The create/update issue functionality is accessible from the plot

container. All the relevant pages are part of the

validationserver cherry object.


Issues created by the validation server will contain a block of

automated code at the end of description and can be easily

filtered from the GitLab issues page using the search string

"Automated code, please do not delete". Relevant plots will be

listed as a note in the issue page, along with the revision label.


Function to upload files to Gitlab helps with pushing error plots

to the project.

"""


def get_gitlab_config(config_path: str) -> configparser.ConfigParser:
    """
    Load the ini file that holds the GitLab API credentials and the project
    information.

    Returns:
        gitlab configparser object
    """
    parser = configparser.ConfigParser()
    parser.read(config_path)
    return parser


def create_gitlab_object(config_path: str) -> gitlab.Gitlab:
    """
    Build a Gitlab object from the default section of the passed ini file
    and authenticate it, so that it can be used for API calls.

    Returns:
        gitlab object, or None if the authentication failed or timed out
    """
    connection = gitlab.Gitlab.from_config(config_files=[config_path])

    try:
        connection.auth()
    except gitlab.exceptions.GitlabAuthenticationError:
        logging.warning(
            "Issue with authenticating GitLab. "
            "Please ensure access token is correct and valid. "
            "GitLab Integration will be disabled."
        )
        return None
    except requests.exceptions.Timeout:
        logging.warning(
            "GitLab servers feeling under the weather, DESY outage? "
            "GitLab Integration will be disabled."
        )
        return None

    logging.info("Established connection with Gitlab")
    return connection


def get_project_object(
    gitlab_object: gitlab.Gitlab, project_id: str
) -> 'gitlab.project':
    """
    Look up the Gitlab project with the given ID (requested with lazy=True).

    Returns:
        gitlab project object
    """
    return gitlab_object.projects.get(project_id, lazy=True)


def search_project_issues(
    gitlab_object: gitlab.Gitlab,
    search_term: str,
    state: str = 'opened',
) -> 'list[gitlab.issues]':
    """
    Query Gitlab for all issues in the given state (open ones by default)
    that match the search term.

    Returns:
        gitlab project issues
    """
    query = {
        "search": search_term,
        "state": state,
        "lazy": True,
        "scope": 'all',
        "get_all": True,
    }
    return gitlab_object.issues.list(**query)


def update_linked_issues(
    gitlab_object: gitlab.Gitlab, cwd_folder: str
) -> None:
    """
    Look up the issues created by the validation server and write their ids
    into the comparison and revision json files below ``cwd_folder``.

    Returns:
        None
    """
    # issues the validation server has worked with carry this marker
    marker = "Automated code, please do not delete"
    open_issues = search_project_issues(gitlab_object, marker)
    closed_issues = search_project_issues(gitlab_object, marker, 'closed')

    # map plot/script name -> linked issue ids; for plots, closed issues are
    # stored as negative numbers to tell them apart from open ones
    plot_issues = collections.defaultdict(list)
    script_issues = collections.defaultdict(list)
    relevant_re = r"Relevant ([a-z]+): (\w+.*\w*)"
    all_issues = open_issues + closed_issues
    n_open = len(open_issues)
    for position, issue in enumerate(all_issues):
        found = re.search(relevant_re, issue.description)
        if not found:
            continue
        kind, target = found.groups()
        if kind != 'plot':
            script_issues[target].append(issue.iid)
        elif position >= n_open:
            plot_issues[target].append(-issue.iid)
        else:
            plot_issues[target].append(issue.iid)

    # comparison json files: one per folder in the html plots folder
    plots_folder = validationpath.get_html_plots_folder(cwd_folder)
    comparison_name = validationpath.file_name_comparison_json
    for label in get_json_object_list(plots_folder, comparison_name):
        json_path = os.path.join(plots_folder, label, comparison_name)
        comparison = deliver_json(json_path)
        for package in comparison["packages"]:
            for plotfile in package.get("plotfiles"):
                for plot in plotfile.get("plots"):
                    plot["issue"] = plot_issues.get(plot["png_filename"], [])

        with open(json_path, "w") as out:
            json.dump(comparison, out, indent=4)

    # revision json files: one per folder in the results folder
    results_folder = validationpath.get_results_folder(cwd_folder)
    results_name = validationpath.file_name_results_json
    for label in get_json_object_list(results_folder, results_name):
        json_path = os.path.join(results_folder, label, results_name)
        revision = deliver_json(json_path)
        for package in revision["packages"]:
            for scriptfile in package.get("scriptfiles"):
                scriptfile["issues"] = script_issues.get(scriptfile["name"], [])

        with open(json_path, "w") as out:
            json.dump(revision, out, indent=4)


def upload_file_gitlab(
    file_path: str, project: 'gitlab.project'
) -> Dict[str, str]:
    """
    Push the file at ``file_path`` to the Gitlab project; the part of the
    path after the last "/" is used as the name of the upload.

    Returns:
        uploaded gitlab project file object
    """
    upload_name = file_path.rpartition("/")[2]
    return project.upload(upload_name, filepath=file_path)


def get_librarians(package: str) -> List[str]:
    """
    Function to get package librarian(s)' GitLab usernames. Temp solution
    until the .librarians file directly provides Gitlab usernames.

    The librarians are read from the ``.librarians`` file of the package and
    translated with ``get_gitlab_account`` from the account map module.
    Blank lines in the ``.librarians`` file are ignored.

    Return:
        list of librarians' Gitlab usernames; empty if the librarian file
        or the account map module cannot be found
    """
    # ``import importlib`` alone does not guarantee that the ``util``
    # submodule is loaded, so import it explicitly.
    import importlib.util

    usernames = []
    librarian_file = os.path.join(
        validationpath.get_basepath()['local'],
        package,
        '.librarians'
    )
    try:
        with open(librarian_file, 'r') as f:
            # drop the line ends and skip blank lines
            librarians = [line.rstrip() for line in f if line.rstrip()]
    except FileNotFoundError:
        logging.exception(
            f"{librarian_file} couldn't be found. Corrupted package/librarian file?"
        )
        return usernames

    # Temp workaround to fetch DESY -> Gitlab map
    desy_map_path = os.path.join(
        "/home/b2soft/gitlab",
        "account_map.py"
    )
    spec = importlib.util.spec_from_file_location('account_map', desy_map_path)
    desy_map = importlib.util.module_from_spec(spec)
    try:
        # the map file is only opened here, so this is where a missing file
        # shows up
        spec.loader.exec_module(desy_map)
    except FileNotFoundError:
        logging.exception(
            f"{desy_map_path} couldn't be found. Have you setup Gitlab Webhook?"
        )
        return usernames

    for librarian in librarians:
        usernames.append(desy_map.get_gitlab_account(librarian))

    return usernames


def parse_contact(
        contact: str,
        map_file: str,
        package: str,
        gitlab_object: gitlab.Gitlab
) -> Dict[str, List]:
    """
    Parse string to find email id(s) and then match them with their Gitlab ids
    using the userid map.

    Each line of the map file is expected to have the format
    'email gitlab_username'. If no username can be determined this way, the
    librarians of ``package`` are used instead.

    Returns :
        Dictionary with list of Gitlab IDs ('gitlab_ids') and corresponding
        list of Gitlab usernames ('usernames').
    """

    email_regex = re.compile(r"([-!#-'*+/-9=?A-Z^-~]+(\.[-!#-'*+/-9=?A-Z^-~]+)*"
                             r"|\"([]!#-[^-~ \t]|(\\[\t -~]))+\")@([-!#-'*+/-9="
                             r"?A-Z^-~]+(\.[-!#-'*+/-9=?A-Z^-~]+)*|\[[\t -Z^-~]"
                             r"*])"
                             )
    addresses = [found.group() for found in email_regex.finditer(contact)]
    assignees = {
        'gitlab_ids': [],
        'usernames': [],
    }

    id_map = []
    try:
        with open(map_file, 'r') as f:
            id_map = f.readlines()
    except FileNotFoundError:
        logging.exception(
            f"{map_file} couldn't be found. Did you get the location right?"
        )
        # without a map there is nothing to match the addresses against
        addresses = []

    for address in addresses:
        # first map line mentioning the address
        map_line = next((line for line in id_map if address in line), None)
        if not map_line:
            logging.error(
                f"No userid found for {address} in the map, could it be that "
                "they are (sadly) no longer in the collaboration?"
            )
            continue
        try:
            username = map_line.split(' ')[1].rstrip()
        except IndexError:
            logging.error(
                f"Map info {map_line} does not match the required format for map "
                "'email gitlab_username'."
            )
            continue
        assignees['usernames'].append(username)

    # Assign to librarian(s) if no contact found
    if not assignees['usernames']:
        assignees['usernames'] = get_librarians(package)
        logging.info(
            "Couldn't find contact/id so assigning issue to the"
            " package librarians."
        )

    for user in assignees['usernames']:
        try:
            assignees['gitlab_ids'].append(
                gitlab_object.users.list(username=user)[0].id
            )
        except IndexError:
            # the user query came back empty
            logging.error(
                f"Could not find {user} in Gitlab."
            )
            continue
    logging.info(
        "Issue will be assigned to "
        f"{[gitlab_object.users.get(user_id) for user_id in assignees['gitlab_ids']]}."
    )

    # to-do: add comment/note if no ids matched

    return assignees


def create_gitlab_issue(
    title: str,
    description: str,
    uploaded_file: Dict[str, str],
    assignees: Dict[str, List],
    package: str,
    project: 'gitlab.project'
) -> str:
    """
    Open a new issue in the Gitlab project, labelled with the package and
    'validation_issue', and attach a note that links the uploaded file.

    Returns:
        created issue id
    """
    new_issue = project.issues.create(
        {
            "title": title,
            "description": description,
            "labels": [package, 'validation_issue'],
        }
    )

    note = new_issue.notes.create(
        {"body": f'View the [error plot/log file]({uploaded_file["url"]}).'}
    )

    gitlab_ids = assignees['gitlab_ids']
    new_issue.assignee_ids = gitlab_ids

    # Workaround for Gitlab not allowing multiple assignees: everybody but
    # the first user is pinged in the note instead
    if len(gitlab_ids) > 1:
        mentions = ' '.join(f'@{user} ' for user in assignees['usernames'][1:])
        note.body += f"\n\nPinging {mentions}"
        note.save()

    new_issue.save()

    logging.info(f"Created a new Gitlab issue - {new_issue.iid}")

    return new_issue.iid


def update_gitlab_issue(
    issue_iid: str,
    uploaded_file: Dict[str, str],
    project: 'gitlab.project',
    file_path: str,
    rev_label: str
) -> None:
    """
    Update an existing project issue with the passed plotfile.

    A note is added to the issue that names the package (second to last
    component of ``file_path``), the plot/script (file name up to the first
    dot) and the revision label, and that links the uploaded file.

    Returns:
        None
    """

    issue = project.issues.get(issue_iid)
    path_parts = file_path.split("/")
    file_name = path_parts[-1]
    name = file_name.split(".")[0]
    package = path_parts[-2]
    # check if this is a plot/script based on file format
    issue_type = 'script' if file_name.split(".")[-1] == 'log' else 'plot'
    issue.notes.create(
        {
            # the blank between the name and the issue type used to be
            # missing, gluing both together in the note
            "body": f'Related observation in validation of `{package}` package, `{name}` '
            f'{issue_type} in `{rev_label}` build. View the [error plot/log file]({uploaded_file["url"]}).'
        }
    )

    issue.save()

    logging.info(f"Updated existing Gitlab issue {issue.iid}")


def update_scriptfile_issues_json(
        revision_json_path: str,
        scritptfile_name: str,
        scritptfile_package: str,
        issue_id: str
) -> None:
    """
    Append ``issue_id`` to the linked issues of a scriptfile in the given
    revision json file and write the file back.

    Returns:
        None
    """
    revision = deliver_json(revision_json_path)

    for pkg in revision["packages"]:
        if pkg["name"] != scritptfile_package:
            continue
        for entry in pkg.get("scriptfiles"):
            if entry["name"] == scritptfile_name:
                entry["issues"].append(issue_id)
                # only the first matching scriptfile of a package is updated
                break

    with open(revision_json_path, "w") as out:
        json.dump(revision, out, indent=4)


def update_plot_issues_json(
        comparison_json_path: str,
        plot_name: str,
        plot_package: str,
        issue_id: str
) -> None:
    """
    Append ``issue_id`` to the linked issues of a plot in the given
    comparison json file and write the file back.

    Returns:
        None
    """
    comparison = deliver_json(comparison_json_path)

    for pkg in comparison["packages"]:
        if pkg["name"] != plot_package:
            continue
        for plotfile in pkg.get("plotfiles"):
            for plot in plotfile.get("plots"):
                if plot["png_filename"] == plot_name:
                    plot["issue"].append(issue_id)
                    # first match per plotfile only; the remaining
                    # plotfiles of the package are still searched
                    break

    with open(comparison_json_path, "w") as out:
        json.dump(comparison, out, indent=4)


class ValidationRoot:

    """
    Root Validation class to handle non-static HTTP requests into the
    validation server. The two main functions are to hand out compiled json
    objects of revisions and comparisons and to start and monitor the
    creation of comparison plots. It also provides the pages used to create
    and update Gitlab issues.
    """

    def __init__(self, working_folder, gitlab_object, gitlab_config, gitlab_map):
        """
        class initializer, which takes the path to the folders containing the
        validation run results and plots (aka comparison), gitlab object and
        config
        """

        # folder below which results and html plots are looked up
        self.working_folder = working_folder

        # time at which this object was created
        self.last_restart = datetime.datetime.now()

        # compact git hash at the time this object was created
        self.version = validationfunctions.get_compact_git_hash(
            os.environ["BELLE2_LOCAL_DIR"]
        )

        # Gitlab object used for API calls; falsy if the integration is off
        self.gitlab_object = gitlab_object

        # configparser object with the Gitlab project information
        self.gitlab_config = gitlab_config

        # path of the 'email gitlab_username' map file (may be None)
        self.gitlab_map = gitlab_map

        # The following three are set by issue() and read by create_issue()
        self.file_path = None
        self.revision_label = None
        self.contact = None

    @cherrypy.expose
    @cherrypy.tools.json_in()
    @cherrypy.tools.json_out()
    def create_comparison(self):
        """
        Triggers the start of a new comparison between the revisions supplied
        in revision_list
        """
        rev_list = cherrypy.request.json["revision_list"]
        logging.debug("Creating plots for revisions: " + str(rev_list))
        progress_key = start_plotting_request(
            rev_list,
            validationpath.get_results_folder(self.working_folder),
        )
        return {"progress_key": progress_key}

    @cherrypy.expose
    def index(self):
        """
        forward to the static landing page if
        the default url is used (like http://localhost:8080/)
        """
        raise cherrypy.HTTPRedirect("/static/validation.html")

    @cherrypy.expose
    def plots(self, *args):
        """
        Serve file from the html/plot directory.
        :param args: For the request /plots/a/b/c, these will be the strings
            "a", "b", "c"
        """

        warn_wrong_directory()

        if len(args) < 3:
            raise cherrypy.HTTPError(404)

        # everything but the last two components selects the comparison
        # folder, the last two select the file within it
        tag_folder = os.path.relpath(
            validationpath.get_html_plots_tag_comparison_folder(
                self.working_folder, args[:-2]
            ),
            validationpath.get_html_folder(self.working_folder),
        )
        path = os.path.join(tag_folder, *args[-2:])
        return cherrypy.lib.static.serve_file(path)

    @cherrypy.expose
    @cherrypy.tools.json_in()
    @cherrypy.tools.json_out()
    def check_comparison_status(self):
        """
        Checks on the status of a comparison creation
        """
        progress_key = cherrypy.request.json["input"]
        logging.debug("Checking status for plot creation: " + str(progress_key))
        status = check_plotting_status(progress_key)
        return status

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def revisions(self, revision_label=None):
        """
        Return a combined json object with all revisions and
        mark the newest one with the field most_recent=true
        """

        # get list of available revision
        rev_list = get_json_object_list(
            validationpath.get_results_folder(self.working_folder),
            validationpath.file_name_results_json,
        )

        # always add the reference revision
        combined_list = []
        reference_revision = json.loads(
            json_objects.dumps(json_objects.Revision(label="reference"))
        )

        # load and combine
        for r in rev_list:
            full_path = os.path.join(
                validationpath.get_results_folder(self.working_folder),
                r,
                validationpath.file_name_results_json,
            )

            # update label, if dir has been moved
            lbl_folder = get_revision_label_from_json_filename(full_path)
            j = deliver_json(full_path)
            j["label"] = lbl_folder
            combined_list.append(j)

        # Sorting

        # Order by categories (nightly, release, etc.) first, then by date
        # A pure chronological order doesn't make sense, because we do not
        # have a linear history ((pre)releases branch off) and for the builds
        # the date corresponds to the build date, not to the date of the
        # actual commit.
        def sort_key(label: str):
            if "-" not in label:
                logging.warning(
                    f"Misformatted label encountered: '{label}' "
                    f"(doesn't seem to include date?)"
                )
                return label
            category, datetag = label.split("-", maxsplit=1)
            # Will later reverse order to bring items in the same category
            # in reverse chronological order, so the following list will have
            # the items in reverse order as well:
            order = ["release", "prerelease", "nightly"]
            try:
                index = order.index(category)
            except ValueError:
                index = 9
                logging.warning(
                    f"Misformatted label encountered: '{label}' (doesn't seem "
                    f"to belong to any known category?)"
                )
            return f"{index}-{datetag}"

        combined_list.sort(key=lambda rev: sort_key(rev["label"]), reverse=True)

        # reference always on top
        combined_list = [reference_revision] + combined_list

        # Set the most recent one ...
        newest_date = None
        newest_rev = None
        for r in combined_list:
            rdate_str = r["creation_date"]
            if not isinstance(rdate_str, str) or not rdate_str:
                continue
            try:
                rdate = time.strptime(rdate_str, "%Y-%m-%d %H:%M")
            except ValueError:
                # some old validation results might still contain
                # seconds and therefore cannot properly be converted
                continue
            if newest_date is None or rdate > newest_date:
                newest_date = rdate
                newest_rev = r

        for c in combined_list:
            if c["most_recent"] is not None:
                c["most_recent"] = False

        # if there are no revisions at all, this might also be just None
        if newest_rev:
            newest_rev["most_recent"] = True

        # topmost item must be dictionary for the ractive.os template to match
        return {"revisions": combined_list}

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def comparisons(self, comparison_label=None):
        """
        return the json file of the comparison results of one specific
        comparison

        :param comparison_label: comma separated list of the compared
            revisions
        :raises cherrypy.HTTPError: 400 if no label is supplied, 404 if there
            is no comparison json file for the label
        """

        warn_wrong_directory()

        # without a label there is nothing to look up
        if not comparison_label:
            raise cherrypy.HTTPError(400, "No comparison label supplied")

        # todo: Make this independent of our working directory!
        path = os.path.join(
            os.path.relpath(
                validationpath.get_html_plots_tag_comparison_folder(
                    self.working_folder, comparison_label.split(",")
                ),
                validationpath.get_html_folder(self.working_folder),
            ),
            "comparison.json",
        )

        # check if this comparison actually exists
        if not os.path.isfile(path):
            raise cherrypy.HTTPError(
                404, f"Json Comparison file {path} does not exist"
            )

        return deliver_json(path)

    @cherrypy.expose
    @cherrypy.tools.json_out()
    def system_info(self):
        """
        Returns:
            JSON file containing git versions and time of last restart
        """

        warn_wrong_directory()

        # note: for some reason %Z doesn't work like this, so we use
        # time.tzname for the time zone.
        return {
            "last_restart": self.last_restart.strftime("%-d %b %H:%M ")
            + time.tzname[1],
            "version_restart": self.version,
            "version_current": validationfunctions.get_compact_git_hash(
                os.environ["BELLE2_LOCAL_DIR"]
            ),
        }

    @cherrypy.expose
    def retrieve_file_metadata(self, filename):
        """
        Returns:
            Metadata(str) of the file
        """
        cherrypy.response.headers['Content-Type'] = 'text/plain'
        metadata = validationfunctions.get_file_metadata(filename)
        return metadata

    @cherrypy.expose
    @cherrypy.tools.json_in()
    @cherrypy.tools.json_out()
    def create_issue(self, title, description):
        """
        Call the functions to create the issue and redirect
        to the created Gitlab issue page.

        The file, revision label and contact are the ones stored by the
        last call of issue().

        :raises cherrypy.HTTPError: 400 if the Gitlab integration is not set
            up or if no file was selected via issue() beforehand
        """

        # fail with a clear message instead of an AttributeError further down
        if not self.gitlab_object:
            raise cherrypy.HTTPError(
                400, "Gitlab integration not set up, verify config file."
            )
        if self.file_path is None:
            raise cherrypy.HTTPError(
                400, "No file selected for the issue, open the issue page first."
            )

        # check if this is a plot/script based on file format
        issue_type = 'plot'
        if 'log' == self.file_path.split("/")[-1].split(".")[-1]:
            issue_type = 'script'
        default_section = self.gitlab_config['global']['default']
        project_id = self.gitlab_config[default_section]['project_id']
        # Create issue in the Gitlab project and save it
        project = get_project_object(self.gitlab_object, project_id)
        uploaded_file = upload_file_gitlab(self.file_path, project)
        assignees = {
            'gitlab_ids': [],
            'usernames': [],
        }
        file_name = self.file_path.split("/")[-1].split(".log")[0]
        file_package = self.file_path.split("/")[-2]
        if self.gitlab_map:
            assignees = parse_contact(
                self.contact, self.gitlab_map, file_package, self.gitlab_object
            )
        # this block is what update_linked_issues searches for and parses
        description += "\n\n---\n\n:robot: Automated code, please do not delete\n\n" + \
            f"Relevant {issue_type}: {file_name}\n\n" + \
            f"Revision label: {self.revision_label}\n\n---"
        issue_id = create_gitlab_issue(
            title, description, uploaded_file, assignees, file_package, project
        )
        project.save()

        # Update JSON with created issue id - script and plot info reside
        # in different locations and also have different structures.
        # todo - maybe this can be combined?
        if issue_type == 'script':
            revision_json_path = os.path.join(
                validationpath.get_results_folder(self.working_folder),
                self.revision_label,
                validationpath.file_name_results_json,
            )
            update_scriptfile_issues_json(
                revision_json_path, file_name, file_package, issue_id)
        else:
            comparison_json_path = os.path.join(
                validationpath.get_html_plots_folder(self.working_folder),
                self.file_path.split("/")[-3],
                "comparison.json",
            )
            update_plot_issues_json(
                comparison_json_path, file_name, file_package, issue_id)

        issue_url = self.gitlab_config[default_section]['project_url'] \
            + "/-/issues/" \
            + str(issue_id)
        raise cherrypy.HTTPRedirect(
            issue_url
        )

    @cherrypy.expose
    def issue(self, file_path, rev_label, contact):
        """
        Return a template issue creation interface
        for the user to add title and description.

        The passed file, revision label and contact are stored on the object
        for the following create_issue() call.
        """
        self.file_path = os.path.join(
            validationpath.get_html_folder(self.working_folder), file_path
        )

        self.revision_label = rev_label
        self.contact = contact

        if not self.gitlab_object:
            return "ERROR: Gitlab integration not set up, verify config file."

        raise cherrypy.HTTPRedirect("/static/validation_issue.html")

    @cherrypy.expose
    def issue_redirect(self, iid):
        """
        Redirect to the Gitlab issue page.
        """
        default_section = self.gitlab_config['global']['default']
        if not self.gitlab_config[default_section]['project_url']:
            return "ERROR: Gitlab integration not set up, verify config file."

        issue_url = self.gitlab_config[default_section]['project_url'] \
            + "/-/issues/" \
            + str(iid)
        raise cherrypy.HTTPRedirect(
            issue_url
        )

    @cherrypy.expose
    def update_issue(self, id, file_path, rev_label):
        """
        Update existing issue in Gitlab with current result plot
        and redirect to the updated Gitlab issue page.
        """

        if not self.gitlab_object:
            return "ERROR: Gitlab integration not set up, verify config file."

        plot_path = os.path.join(
            validationpath.get_html_folder(self.working_folder), file_path
        )

        default_section = self.gitlab_config['global']['default']
        project_id = self.gitlab_config[default_section]['project_id']
        project = get_project_object(self.gitlab_object, project_id)
        uploaded_file = upload_file_gitlab(plot_path, project)
        update_gitlab_issue(
            id, uploaded_file, project, plot_path, rev_label
        )
        project.save()

        issue_url = self.gitlab_config[default_section]['project_url'] \
            + "/-/issues/" \
            + str(id)

        raise cherrypy.HTTPRedirect(
            issue_url
        )


def setup_gzip_compression(path, cherry_config):
    """
    Switch on GZip compression for the text-based content served below
    one path of the web-server.

    The gzip options are merged into the already existing entry
    cherry_config[path]; other options stored there are kept.
    """

    path_settings = cherry_config[path]

    compressible_mime_types = [
        "text/html",
        "text/plain",
        "text/css",
        "application/javascript",
        "application/json",
    ]

    gzip_settings = {}
    gzip_settings["tools.gzip.on"] = True
    gzip_settings["tools.gzip.mime_types"] = compressible_mime_types

    path_settings.update(gzip_settings)


def get_argument_parser():
    """
    Prepare a parser for all the known command line arguments

    The parser is only set up here, nothing is parsed. Returns the
    configured argparse.ArgumentParser.
    """

    # Set up the command line parser
    parser = argparse.ArgumentParser()

    # Define the accepted command line flags
    parser.add_argument(
        "-ip",
        "--ip",
        help="The IP address on which the "
        "server starts. Default is '127.0.0.1'.",
        type=str,
        default="127.0.0.1",
    )
    parser.add_argument(
        "-p",
        "--port",
        help="The port number on which"
        " the server starts. Default is '8000'.",
        # int, like the default: the port has the same type whether or not
        # it was given, and non-numeric values are rejected by argparse.
        type=int,
        default=8000,
    )
    parser.add_argument(
        "-v",
        "--view",
        help="Open validation website" " in the system's default browser.",
        action="store_true",
    )
    parser.add_argument(
        "--production",
        help="Run in production environment: "
        "no log/error output via website and no auto-reload",
        action="store_true",
    )
    parser.add_argument(
        "-u",
        "--usermap",
        help="Path of file containing <email gitlab_username> map.",
        type=str,
        default=None,
    )

    return parser


def parse_cmd_line_arguments():
    """!
    Builds the parser for the known command line arguments and
    evaluates the command line with it.
    @return: The object produced by the parser's parse_args() call.
    Each argument is available as an attribute of that object,
    i.e. [name_of_object].[desired_argument]
    """
    return get_argument_parser().parse_args()


def run_server(
    ip="127.0.0.1",
    port=8000,
    parse_command_line=False,
    open_site=False,
    dry_run=False,
):
    """
    Configure the cherrypy web-server for the validation website and
    start it.

    ip, port: Address and port the server binds to.
    parse_command_line: If True, ip, port and open_site are replaced by
        the values from the command line, which additionally provides the
        production switch and the usermap file.
    open_site: If True, the site is opened in the system's default browser.
    dry_run: If True, all preparations are done, but neither the Gitlab
        integration is set up nor the server is started.

    Side effects: creates the folders html and html/plots below the
    current working directory if needed and changes into html.
    Terminates via sys.exit if no basf2 release is set up, no static
    content is found or the results folder is missing or has no
    sub-folders.
    """

    # Setup options for logging
    logging.basicConfig(
        level=logging.DEBUG,
        format="%(asctime)s %(levelname)-8s %(message)s",
        datefmt="%H:%M:%S",
    )

    basepath = validationpath.get_basepath()
    # Remember the start folder, the working directory is changed below.
    cwd_folder = os.getcwd()

    # Only execute the program if a basf2 release is set up!
    if (
        os.environ.get("BELLE2_RELEASE_DIR", None) is None
        and os.environ.get("BELLE2_LOCAL_DIR", None) is None
    ):
        sys.exit("Error: No basf2 release set up!")

    cherry_config = dict()
    # just empty, will be filled below
    cherry_config["/"] = {}
    # will ensure also the json requests are gzipped
    setup_gzip_compression("/", cherry_config)

    # check if static files are provided via central release
    static_folder_list = ["validation", "html_static"]
    static_folder = None

    if basepath["central"] is not None:
        static_folder_central = os.path.join(
            basepath["central"], *static_folder_list
        )
        if os.path.isdir(static_folder_central):
            static_folder = static_folder_central

    # check if there is also a collection of static files in the local release
    # this overwrites the usage of the central release
    if basepath["local"] is not None:
        static_folder_local = os.path.join(
            basepath["local"], *static_folder_list
        )
        if os.path.isdir(static_folder_local):
            static_folder = static_folder_local

    if static_folder is None:
        sys.exit(
            "Either BELLE2_RELEASE_DIR or BELLE2_LOCAL_DIR has to set "
            "to provide static HTML content. Did you run b2setup ?"
        )

    # join the paths of the various result folders
    results_folder = validationpath.get_results_folder(cwd_folder)
    comparison_folder = validationpath.get_html_plots_folder(cwd_folder)

    logging.info(f"Serving static content from {static_folder}")
    logging.info(f"Serving result content and plots from {cwd_folder}")

    # check if the results folder exists and has at least one folder
    if not os.path.isdir(results_folder):
        sys.exit(
            f"Result folder {results_folder} does not exist, run validate_basf2 first " +
            "to create validation output"
        )

    has_result_folders = any(
        os.path.isdir(os.path.join(results_folder, entry))
        for entry in os.listdir(results_folder)
    )
    if not has_result_folders:
        sys.exit(
            f"Result folder {results_folder} contains no folders, run "
            f"validate_basf2 first to create validation output"
        )

    # Go to the html directory; exist_ok avoids the check-then-create race
    os.makedirs("html", exist_ok=True)
    os.chdir("html")

    os.makedirs("plots", exist_ok=True)

    if os.path.exists("plots/rainbow.json"):
        logging.info("Removing old plots and unpopular combinations")
        validationfunctions.clear_plots(
            comparison_folder,
            validationfunctions.get_popular_revision_combinations(cwd_folder)
        )

    # export js, css and html templates
    cherry_config["/static"] = {
        "tools.staticdir.on": True,
        # only serve js, css, html and png files
        "tools.staticdir.match": r"^.*\.(js|css|html|png|js.map)$",
        "tools.staticdir.dir": static_folder,
    }
    setup_gzip_compression("/static", cherry_config)

    # export generated plots
    cherry_config["/plots"] = {
        "tools.staticdir.on": True,
        # only serve png, json and pdf files
        "tools.staticdir.match": r"^.*\.(png|json|pdf)$",
        "tools.staticdir.dir": comparison_folder,
    }
    setup_gzip_compression("/plots", cherry_config)

    # export generated results and raw root files
    cherry_config["/results"] = {
        "tools.staticdir.on": True,
        "tools.staticdir.dir": results_folder,
        # only serve root, log and txt files
        "tools.staticdir.match": r"^.*\.(log|root|txt)$",
        # serve the log files as plain text files, and make sure to use
        # utf-8 encoding. Firefox might decide different, if the files
        # are located on a .jp domain and use Shift_JIS
        "tools.staticdir.content_types": {
            "log": "text/plain; charset=utf-8",
            "root": "application/octet-stream",
        },
    }

    setup_gzip_compression("/results", cherry_config)

    # Settings that can only come from the command line. They need a
    # value on every path: the usermap is read further down even when the
    # command line is not parsed.
    production_env = False
    usermap_file = None
    if parse_command_line:
        # Parse command line arguments
        cmd_arguments = parse_cmd_line_arguments()

        ip = cmd_arguments.ip
        port = int(cmd_arguments.port)
        open_site = cmd_arguments.view
        production_env = cmd_arguments.production
        usermap_file = cmd_arguments.usermap

    cherrypy.config.update(
        {
            "server.socket_host": ip,
            "server.socket_port": port,
        }
    )
    if production_env:
        cherrypy.config.update({"environment": "production"})

    logging.info(f"Server: Starting HTTP server on {ip}:{port}")

    if open_site:
        webbrowser.open("http://" + ip + ":" + str(port))

    config_path = os.path.join(static_folder, '../config/gl.cfg')

    if not dry_run:
        # gitlab toggle: everything stays None unless the config file
        # exists and a Gitlab object could be created from it
        gitlab_object = None
        gitlab_config = None
        gitlab_map = None
        if not os.path.exists(config_path):
            logging.warning(
                "ERROR: Expected to find config folder with Gitlab config,"
                f" but {config_path} doesn't exist. "
                "Gitlab features will not work."
            )
        else:
            gitlab_config = get_gitlab_config(config_path)
            gitlab_object = create_gitlab_object(config_path)
            if gitlab_object:
                update_linked_issues(gitlab_object, cwd_folder)
                gitlab_map = usermap_file
                logging.info(
                    f"{gitlab_map} will be used to assign issues."
                )

        cherrypy.quickstart(
            ValidationRoot(
                working_folder=cwd_folder,
                gitlab_object=gitlab_object,
                gitlab_config=gitlab_config,
                gitlab_map=gitlab_map,
            ),
            "/",
            cherry_config,
        )


# Script entry point: start the validation server with run_server()'s
# default arguments.
# NOTE(review): the command line is not parsed on this path, because
# parse_command_line defaults to False - confirm this is intended.
if __name__ == "__main__":

    run_server()


json_objects.Revision
Definition: json_objects.py:34

validationserver.ValidationRoot
Definition: validationserver.py:651

validationserver.ValidationRoot.issue_redirect
def issue_redirect(self, iid)
Definition: validationserver.py:999

validationserver.ValidationRoot.contact
contact
placeholder variable for contact
Definition: validationserver.py:693

validationserver.ValidationRoot.check_comparison_status
def check_comparison_status(self)
Definition: validationserver.py:744

validationserver.ValidationRoot.create_comparison
def create_comparison(self)
Definition: validationserver.py:698

validationserver.ValidationRoot.gitlab_config
gitlab_config
Gitlab config.
Definition: validationserver.py:683

validationserver.ValidationRoot.last_restart
last_restart
Date when this object was instantiated.
Definition: validationserver.py:672

validationserver.ValidationRoot.comparisons
def comparisons(self, comparison_label=None)
Definition: validationserver.py:859

validationserver.ValidationRoot.version
version
Git version.
Definition: validationserver.py:675

validationserver.ValidationRoot.__init__
def __init__(self, working_folder, gitlab_object, gitlab_config, gitlab_map)
Definition: validationserver.py:661

validationserver.ValidationRoot.issue
def issue(self, file_path, rev_label, contact)
Definition: validationserver.py:981

validationserver.ValidationRoot.index
def index(self)
Definition: validationserver.py:712

validationserver.ValidationRoot.revisions
def revisions(self, revision_label=None)
Definition: validationserver.py:755

validationserver.ValidationRoot.gitlab_map
gitlab_map
Gitlab usermap.
Definition: validationserver.py:686

validationserver.ValidationRoot.retrieve_file_metadata
def retrieve_file_metadata(self, filename)
Definition: validationserver.py:908

validationserver.ValidationRoot.file_path
file_path
placeholder variable for path
Definition: validationserver.py:689

validationserver.ValidationRoot.working_folder
working_folder
html folder that contains plots etc.
Definition: validationserver.py:669

validationserver.ValidationRoot.update_issue
def update_issue(self, id, file_path, rev_label)
Definition: validationserver.py:1015

validationserver.ValidationRoot.create_issue
def create_issue(self, title, description)
Definition: validationserver.py:920

validationserver.ValidationRoot.plots
def plots(self, *args)
Definition: validationserver.py:720

validationserver.ValidationRoot.gitlab_object
gitlab_object
Gitlab object.
Definition: validationserver.py:680

validationserver.ValidationRoot.system_info
def system_info(self)
Definition: validationserver.py:888

validationserver.ValidationRoot.revision_label
revision_label
placeholder variable for revision label
Definition: validationserver.py:691

json_objects.dumps
def dumps(obj)
Definition: json_objects.py:614

validationfunctions.get_compact_git_hash
Optional[str] get_compact_git_hash(str repo_folder)
Definition: validationfunctions.py:55

validationfunctions.get_file_metadata
str get_file_metadata(str filename)
Definition: validationfunctions.py:737

validationfunctions.clear_plots
def clear_plots(str work_folder, List[str] keep_revisions)
Definition: validationfunctions.py:215

validationfunctions.get_popular_revision_combinations
List[str] get_popular_revision_combinations(str work_folder)
Definition: validationfunctions.py:136

validationpath.get_html_folder
def get_html_folder(output_base_dir)
Definition: validationpath.py:86

validationpath.get_basepath
def get_basepath()
Definition: validationpath.py:28

validationpath.get_html_plots_folder
def get_html_plots_folder(output_base_dir)
Definition: validationpath.py:93

validationpath.get_results_folder
def get_results_folder(output_base_dir)
Definition: validationpath.py:79

validationpath.get_html_plots_tag_comparison_folder
def get_html_plots_tag_comparison_folder(output_base_dir, tags)
Definition: validationpath.py:100