# Source code for stixcore.processing.publish

import os
import sys
import shutil
import logging
import smtplib
import sqlite3
import argparse
import tempfile
import itertools
from io import StringIO
from enum import Enum
from pprint import pformat
from pathlib import Path
from datetime import date, datetime, timezone, timedelta
from collections import defaultdict

from paramiko import SSHClient
from scp import SCPClient

import astropy.units as u
from astropy.io import ascii, fits
from astropy.io.fits.diff import HDUDiff
from astropy.table import Table

from stixcore.config.config import CONFIG
from stixcore.ephemeris.manager import Spice, SpiceKernelManager
from stixcore.io.RidLutManager import RidLutManager
from stixcore.products.product import Product
from stixcore.time.datetime import SCETime
from stixcore.util.logging import get_logger
from stixcore.util.util import get_complete_file_name, is_incomplete_file_name

# Public API of this module (each name listed exactly once).
__all__ = ["PublishConflicts", "PublishHistoryStorage", "publish_fits_to_esa", "PublishResult"]

# Module level logger used by all functions and classes below.
logger = get_logger(__name__)



[docs]
class PublishConflicts(Enum):
    """Relation of a newly registered file to the files already tracked in the history DB."""

    #: The file raises no conflict, so it is published without any error or duplication handling.
    ADDED = 0

    #: Other files with the same resulting ESA file name were already published to ESA
    #: (the request id modifier is truncated from the ESA name).
    SAME_ESA_NAME = 1

    #: The very same file was published before, nothing to do.
    SAME_EXISTS = 2




[docs]
class PublishResult(Enum):
    """Final state of a single file after a publishing run to ESA."""

    #: All good, the file was published.
    PUBLISHED = 10

    #: The file was ignored and not published to ESA.
    IGNORED = 11

    #: Other files with the same ESA file name have already been published.
    #: Therefore the file name was modified to a supplementary data product (-sup1/2).
    MODIFIED = 12

    #: The file was ignored via a blacklist and not published to ESA.
    BLACKLISTED = 13

    #: An error was raised during publication.
    ERROR = 14



class Capturing(list):
    """List that, used as a context manager, collects the lines printed to stdout.

    While the ``with`` block is active ``sys.stdout`` is replaced by an in-memory
    buffer. On exit the buffered text is split into lines and appended to this list,
    and the previous ``sys.stdout`` is put back in place.
    """

    def __enter__(self):
        # remember the current stream so it can be restored on exit
        self._stdout = sys.stdout
        buffer = StringIO()
        sys.stdout = buffer
        self._stringio = buffer
        return self

    def __exit__(self, *args):
        captured_text = self._stringio.getvalue()
        self.extend(captured_text.splitlines())
        # drop the buffer to free up some memory
        del self._stringio
        sys.stdout = self._stdout



[docs]
class PublishHistoryStorage:
    """Persistent handler for meta data on already published files.

    The history is stored in the table ``published`` of a sqlite database file.
    Each row tracks one file by its (unique) file name together with its truncated
    ESA file name, an optional modified ESA name and the publishing result.
    """

    def __init__(self, filename):
        """Create a new persistent handler. Will open or create the given sqlite DB file.

        Parameters
        ----------
        filename : path like object
            path to the sqlite database file
        """
        self.conn = None
        self.cur = None
        self.filename = filename
        self._connect_database()

    def _connect_database(self):
        """Connects to the sqlite file or creates an empty one if not present.

        Raises
        ------
        sqlite3.Error
            if the database could not be opened or the schema could not be created
        """
        try:
            self.conn = sqlite3.connect(self.filename)
            self.cur = self.conn.cursor()
            logger.info(f"PublishHistory DB loaded from {self.filename}")

            sql = """CREATE TABLE if not exists published (
                        id INTEGER PRIMARY KEY AUTOINCREMENT,
                        name TEXT UNIQUE NOT NULL,
                        path TEXT NOT NULL,
                        version INTEGER NOT NULL,
                        p_date FLOAT NOT NULL,
                        m_date FLOAT NOT NULL,
                        esaname TEXT NOT NULL,
                        modified_esaname TEXT,
                        result INTEGER
                    )
            """
            self.cur.execute(sql)
            self.cur.execute("CREATE INDEX if not exists esaname ON published (esaname)")
            self.cur.execute("CREATE INDEX if not exists p_date ON published (p_date)")

            self.conn.commit()
        except sqlite3.Error:
            logger.error(f"Failed load DB from {self.filename}")
            self.close()
            raise

    def close(self):
        """Commit pending changes and close the history DB connection.

        Calling this on an already closed handler only logs a warning.
        """
        if self.conn is None:
            logger.warning("DB connection already closed")
            return
        try:
            self.conn.commit()
        finally:
            self.conn.close()
            # forget both handles so a repeated close() does not touch a closed connection
            self.conn = None
            self.cur = None

    def is_connected(self):
        """Is the handler connected to the db file.

        Returns
        -------
        True | False
        """
        return bool(self.cur)

    def count(self):
        """Counts the number of entries in the DB

        Returns
        -------
        int
            number of tracked files
        """
        return self._execute("select count(1) from published")[0][0]

    def add(self, path):
        """Adds a new file to the history.

        The version and the ESA name are derived from the file name: the name is split
        at ``_``, the fifth part is parsed as version and the first five parts form the
        ESA name.

        Parameters
        ----------
        path : path like object
            path to the FITS file to be published

        Returns
        -------
        (`PublishConflicts`, `list`)
            PublishConflicts with already published files and a list of all "conflicting files"
            including the newly added files as last entry.
        """
        name = path.name
        parent_dir = str(path.parent)
        published_at = datetime.now().timestamp()
        # NOTE(review): the [:-5] slice assumes a ".fits" suffix; for other suffixes
        # (e.g. ".svg") one more character of the version is cut off - confirm intended.
        parts = name[:-5].split("_")
        version = int(parts[4].lower().replace("v", "").replace("u", ""))
        esa_name = "_".join(parts[0:5])
        # the status change time of the file is what gets stored in the m_date column
        m_date = path.stat().st_ctime
        try:
            self.cur.execute(
                """insert into published
                                    (name, path, version, p_date, m_date, esaname)
                                    values(?, ?, ?, ?, ?, ?)""",
                (name, parent_dir, version, published_at, m_date, esa_name),
            )
        except sqlite3.IntegrityError:
            # unique constraint on the file name: the very same file is already tracked
            return (PublishConflicts.SAME_EXISTS, self.find_by_name(name))

        others = self.find_by_esa_name(esa_name)
        if len(others) > 1:
            return (PublishConflicts.SAME_ESA_NAME, others)
        return (PublishConflicts.ADDED, others)

    def _execute(self, sql, arguments=None, result_type="list"):
        """Execute sql and return results in a list or a dictionary.

        Parameters
        ----------
        sql : `str`
            the statement to execute
        arguments : `tuple`, optional
            values bound to the ``?`` placeholders of the statement
        result_type : `str`, optional
            "list" returns the raw row tuples, any other value returns one dict
            (column name -> value) per row

        Returns
        -------
        `list`
            the fetched rows; empty for statements that do not return rows

        Raises
        ------
        Exception
            if the handler is not connected to a database
        """
        if not self.cur:
            raise Exception("DB is not initialized!")

        if arguments:
            self.cur.execute(sql, arguments)
        else:
            self.cur.execute(sql)

        rows = self.cur.fetchall()
        if result_type == "list":
            return rows

        # description is None for statements without a result set (e.g. update)
        columns = [column[0] for column in (self.cur.description or ())]
        return [dict(zip(columns, row)) for row in rows]

    def find_by_name(self, name):
        """Finds a history entry based on the file name (unique constraint).

        Parameters
        ----------
        name : `str`
            the file name

        Returns
        -------
        `list`
            list with the matching history entry as dict, empty if nothing was found
        """
        return self._execute("select * from published where name = ?", (name,), result_type="hash")

    def find_by_esa_name(self, esa_name):
        """Finds all history entries based on the the ESA name (not unique).

        Parameters
        ----------
        esa_name : `str`
            the truncated ESA file name of the fits file

        Returns
        -------
        `list`
            list of all found files (as dict) with the same ESA file name,
            ordered by publishing date (oldest first)
        """
        return self._execute(
            "select * from published where esaname = ? order by p_date asc", (esa_name,), result_type="hash"
        )

    def set_modified_esa_name(self, name, id):
        """Updates the modified ESA file name of an entry.

        Parameters
        ----------
        name : `str`
            the new modified esa name
        id : `int`
            the id of the entry to update

        Returns
        -------
        `list`
            the rows returned by the update statement (an empty list)
        """
        return self._execute("update published set modified_esaname = ? where id = ? ", (name, id), result_type="hash")

    def set_result(self, result, id):
        """Sets the result of a publishing action for a given file.

        Parameters
        ----------
        result : `PublishResult`
            the result, its ``value`` is stored
        id : `int`
            the id of the entry to update

        Returns
        -------
        `list`
            the rows returned by the update statement (an empty list)
        """
        return self._execute("update published set result = ? where id = ? ", (result.value, id), result_type="hash")

    def get_all(self):
        """Queries all entries

        Returns
        -------
        `list`
            all found entries as row tuples.
        """
        return self._execute("select * from published")




def send_mail_report(files):
    """Sends a report mail to configured receivers after each run.

    Nothing is sent unless the config option ``Publish.report_mail_send`` is enabled.
    Any error while composing or sending the mail is logged and not raised.

    Parameters
    ----------
    files : dict
        all handled files grouped by the success/error state (`PublishResult` as key)
    """
    if not CONFIG.getboolean("Publish", "report_mail_send", fallback=False):
        return

    try:
        sender = CONFIG.get("Pipeline", "error_mail_sender", fallback="")
        # tolerate blanks around the comma separated addresses
        receivers = [
            receiver.strip()
            for receiver in CONFIG.get("Publish", "report_mail_receivers").split(",")
            if receiver.strip()
        ]
        host = CONFIG.get("Pipeline", "error_mail_smpt_host", fallback="localhost")
        port = CONFIG.getint("Pipeline", "error_mail_smpt_port", fallback=25)
        su = (
            f"E {len(files[PublishResult.ERROR])} "
            f"I {len(files[PublishResult.IGNORED]) + len(files[PublishResult.BLACKLISTED])} "
            f"S {len(files[PublishResult.MODIFIED])} "
            f"P {len(files[PublishResult.PUBLISHED])}"
        )
        error = "" if len(files[PublishResult.ERROR]) <= 0 else "ERROR-"
        message = f"""Subject: StixCore TMTC Publishing {error}Report {su}


ERRORS (E)
**********
{pformat(files[PublishResult.ERROR])}

PUBLISHED ESA DUPLICATES (D)
****************************

RE-REQUESTED (I)
****************
{pformat(files[PublishResult.IGNORED])}

SUPPLEMENTS (S)
***************
{pformat(files[PublishResult.MODIFIED])}

BLACKLISTED (I)
***************
{pformat(files[PublishResult.BLACKLISTED])}

PUBLISHED (P)
*************
{pformat(files[PublishResult.PUBLISHED])}


StixCore

==========================

do not answer to this mail.
"""
        # the context manager closes the SMTP connection even if sending fails
        with smtplib.SMTP(host=host, port=port) as smtp_server:
            smtp_server.sendmail(sender, receivers, message)
    except Exception as e:
        logger.error(f"Error: unable to send report email: {e}")


def update_ephemeris_headers(fits_file, spice):
    """Refresh the SPICE derived header keywords of a FITS file in place.

    Only products of level L1, L2 or ANC are touched. For those the header of the
    first HDU gets a HISTORY entry, a completed FILENAME and the ephemeris keywords
    provided by ``spice``.

    Parameters
    ----------
    fits_file : Path
        path to FITS file
    spice : SpiceKernelManager
        Spice kernel manager with loaded spice kernels.
    """
    product = Product(fits_file)
    if product.level not in ["L1", "L2", "ANC"]:
        return

    start_time = product.utc_timerange.start
    average_time = product.utc_timerange.center
    ephemeris_headers = spice.get_fits_headers(start_time=start_time, average_time=average_time)

    with fits.open(fits_file, "update") as hdul:
        # just update the first (primary) HDU
        primary = next(iter(hdul), None)
        if primary is not None:
            stamp = datetime.now().isoformat(timespec="milliseconds")
            primary.header["HISTORY"] = f"updated ephemeris header with latest kernel at {stamp}"
            # rename the header filename to be complete
            primary.header["FILENAME"] = get_complete_file_name(primary.header["FILENAME"])
            primary.header.update(ephemeris_headers)

    logger.info(f"updated ephemeris headers of {fits_file}")


def add_BSD_comment(p):
    """Adds a comment in the FITS header in case of BSD with the request ID and reason.

    The request id is taken from the sixth ``_`` separated part of the file name
    (the digits before the first ``-``). File names with fewer parts are left untouched.
    Any failure (unparsable id, lookup or header write error) is logged and results
    in an empty return value.

    Parameters
    ----------
    p : Path
        Path to FITS file

    Returns
    -------
    str
        the comment string in case of BSD, otherwise an empty string
    """
    # bound up front so the log message below can never hit an unbound name
    rid = None
    try:
        parts = p.name.split("_")
        if len(parts) > 5:
            rid = parts[5].replace(".fits", "")
            rid = int(rid.split("-")[0])

            reason = RidLutManager.instance.get_reason(rid)

            c_entry = f"BSD request id: '{rid}' reason: '{reason}'"
            fits.setval(p, "COMMENT", value=c_entry)
            return c_entry
    except Exception as e:
        logger.debug(e, exc_info=True)
        logger.info(f"no BSD request comment added nothing found in LUT for rid: {rid}")
    return ""


def add_history(p, name):
    """Write a HISTORY keyword stating that the file was published to SOAR right now.

    Parameters
    ----------
    p : Path
        the path to the fits file
    name : str
        the ESA file name version of the FITS file.
    """
    published_at = datetime.now().isoformat(timespec="milliseconds")
    fits.setval(p, "HISTORY", value=f"published to ESA SOAR as '{name}' on {published_at}")


def copy_file(scp, p, target_dir, add_history_entry=True):
    """Deliver a file to the SOAR out directory, locally or via secure copy.

    Parameters
    ----------
    scp : SCPClient
        A secure copy connection to a remote server.
        If None a copy to a folder on the local server is done.
    p : Path
        the path to the fits file
    target_dir : path like object
        the target directory where the file should be copied to.
        Local if scp is None otherwise on a remote server.
    add_history_entry : bool, optional
        should a History entry be added to the fits header before the copy, by default True

    Returns
    -------
    (Done, Error)
        tuple (bool, Exception)
        ``(True, None)`` if the copy went well, otherwise ``(False, <raised exception>)``.
        Errors while writing the history entry are not caught here.
    """
    if add_history_entry:
        add_history(p, p.name)

    try:
        if scp:
            scp.put(p, remote_path=target_dir)
        else:
            shutil.copy(p, target_dir)
    except Exception as copy_error:
        return (False, copy_error)
    else:
        return (True, None)



[docs]
def publish_fits_to_esa(args):
    """CLI STIX publish to ESA processing step

    Collects all ``solo_*.fits`` and ``solo_*.svg`` files below the input directory that
    match the configured levels, versions and products, that are older than the waiting
    period and that are not yet tracked in the publish history. Each of them is registered
    in the history DB and then copied to the target directory (local or via scp),
    ignored, blacklisted or published as supplement (-sup1/-sup2) depending on conflicts
    with already published files. Finally a mail report is sent (if configured) and the
    supplement report is appended.

    Parameters
    ----------
    args : list
        see -h for details

    Returns
    -------
    dict
        all handled files grouped by `PublishResult`,
        or None if the input FITS directory does not exist
    """

    parser = argparse.ArgumentParser(
        description="STIX publish to ESA processing step", formatter_class=argparse.ArgumentDefaultsHelpFormatter
    )

    # paths
    parser.add_argument(
        "-t",
        "--target_dir",
        help="target directory where fits files should be copied to",
        default=CONFIG.get("Publish", "target_dir"),
        type=str,
    )

    # paths
    parser.add_argument(
        "-T",
        "--target_host",
        help="target host server where fits files should be copied to",
        default=CONFIG.get("Publish", "target_host", fallback="localhost"),
        type=str,
    )

    parser.add_argument(
        "-s",
        "--same_esa_name_dir",
        help=(
            "target directory where fits files should be copied to if there are "
            "any naming conflicts with already published files"
        ),
        default=CONFIG.get("Publish", "same_esa_name_dir"),
        type=str,
    )

    parser.add_argument(
        "-r",
        "--rid_lut_file",
        help=("Path to the rid LUT file"),
        default=CONFIG.get("Publish", "rid_lut_file"),
        type=str,
    )

    parser.add_argument(
        "--update_rid_lut",
        help="update rid lut file before publishing",
        default=False,
        action="store_true",
        dest="update_rid_lut",
    )

    parser.add_argument(
        "--sort_files",
        help="should the matched FITS be sorted by name before publishing.",
        default=False,
        action="store_true",
        dest="sort_files",
    )

    parser.add_argument(
        "--blacklist_files",
        help="input txt file with file names to that should not be delivered",
        default=None,
        type=str,
        dest="blacklist_files",
    )

    parser.add_argument(
        "--supplement_report",
        help="path to file where supplements and request reasons are summarized",
        default=CONFIG.get("Publish", "supplement_report", fallback=str(Path.home() / "supplement_report.csv")),
        type=str,
        dest="supplement_report",
    )

    parser.add_argument(
        "-d",
        "--db_file",
        help="Path to the history publishing database",
        type=str,
        default=CONFIG.get("Publish", "db_file", fallback=str(Path.home() / "published.sqlite")),
    )

    parser.add_argument(
        "-w",
        "--waiting_period",
        help="how long to wait after last file modification before publishing",
        default=CONFIG.get("Publish", "waiting_period", fallback="14d"),
        type=str,
    )

    parser.add_argument(
        "-n",
        "--batch_size",
        help="maximum number of files to publish at this run",
        default=CONFIG.getint("Publish", "batch_size", fallback=-1),
        type=int,
    )

    parser.add_argument(
        "-v",
        "--include_versions",
        help="what versions should be published",
        default=CONFIG.get("Publish", "include_versions", fallback="*"),
        type=str,
    )

    parser.add_argument(
        "-l",
        "--include_levels",
        help="what levels should be published",
        type=str,
        default=CONFIG.get("Publish", "include_levels", fallback="L0, L1, L2, ANC, LL03, CAL"),
    )

    parser.add_argument(
        "-p",
        "--include_products",
        help="what products should be published",
        type=str,
        default=CONFIG.get("Publish", "include_products", fallback="ql,hk,sci,asp,cal"),
    )

    parser.add_argument(
        "-f",
        "--fits_dir",
        help="input FITS directory for files to publish ",
        default=CONFIG.get("Publish", "fits_dir"),
        type=str,
    )

    parser.add_argument(
        "-o",
        "--log_dir",
        help="output directory for daily logging ",
        default=CONFIG.get("Publish", "log_dir", fallback=str(Path.home())),
        type=str,
        dest="log_dir",
    )

    parser.add_argument(
        "--log_level",
        help="the level of logging",
        default=None,
        type=str,
        choices=["CRITICAL", "ERROR", "WARNING", "INFO", "DEBUG", "NOTSET"],
        dest="log_level",
    )

    parser.add_argument("-S", "--spice_file", help="path to the spice meta kernel", default=None, type=str)

    args = parser.parse_args(args)

    # one log file per day, appended to on repeated runs
    logging.basicConfig(
        format="%(asctime)s %(message)s",
        force=True,
        filename=Path(args.log_dir) / f"pub_{date.today().strftime('%Y%m%d')}.log",
        filemode="a+",
    )

    if args.log_level:
        logging.getLogger().setLevel(logging.getLevelName(args.log_level))

    if args.spice_file:
        spicemeta = [Path(args.spice_file)]
    else:
        _spm = SpiceKernelManager(Path(CONFIG.get("Paths", "spice_kernels")))
        spicemeta = _spm.get_latest_mk()

    spice = Spice(spicemeta)
    Spice.instance = spice

    RidLutManager.instance = RidLutManager(Path(args.rid_lut_file), update=args.update_rid_lut)

    ssh = None
    scp = None
    if args.target_host != "localhost":
        ssh = SSHClient()
        ssh.load_system_host_keys()
        ssh.connect(args.target_host)

        # SCPCLient takes a paramiko transport as an argument
        scp = SCPClient(ssh.get_transport())

    def _close_remote():
        """Release the remote copy channel and its SSH connection, if any was opened."""
        if scp is not None:
            scp.close()
        if ssh is not None:
            ssh.close()

    db_file = Path(args.db_file)
    fits_dir = Path(args.fits_dir)
    if not fits_dir.exists():
        logger.error(f"path not found to input files: {fits_dir}")
        _close_remote()
        return

    wait_period = u.Quantity(args.waiting_period)
    wait_period_s = wait_period.to(u.s).value

    LL_wait_period = u.Quantity(CONFIG.get("Publish", "LL_waiting_period", fallback="1min"))
    LL_wait_period_s = LL_wait_period.to(u.s).value

    target_dir = Path(args.target_dir)
    if (scp is None) and (not target_dir.exists()):
        logger.info(f"path not found to target dir: {target_dir} creating dir")
        target_dir.mkdir(parents=True, exist_ok=True)

    same_esa_name_dir = Path(args.same_esa_name_dir)
    if not same_esa_name_dir.exists():
        logger.info(f"path not found to target dir: {same_esa_name_dir} creating dir")
        same_esa_name_dir.mkdir(parents=True, exist_ok=True)

    include_levels = {level: 1 for level in args.include_levels.lower().replace(" ", "").split(",")}

    # the lookup tables stay empty (but defined) if "*" selects everything
    include_all_versions = args.include_versions == "*"
    include_versions = {}
    if not include_all_versions:
        include_versions = {
            int(version): 1
            for version in args.include_versions.lower().replace(" ", "").replace("v", "").split(",")
        }

    include_all_products = args.include_products == "*"
    include_products = {}
    if not include_all_products:
        include_products = {prod: 1 for prod in args.include_products.lower().replace(" ", "").split(",")}

    fits_candidates = fits_dir.rglob("solo_*.fits")
    img_candidates = fits_dir.rglob("solo_*.svg")
    candidates = itertools.chain(img_candidates, fits_candidates)
    to_publish = list()
    now = datetime.now().timestamp()
    next_week = datetime.now(timezone.utc) + timedelta(hours=24 * 7)
    hist = PublishHistoryStorage(db_file)
    n_candidates = 0

    blacklist_files = list()

    if args.blacklist_files:
        try:
            with open(args.blacklist_files) as f:
                for ifile in f:
                    try:
                        ifile = ifile.strip()
                        if len(ifile) > 1:
                            blacklist_files.append(ifile)
                    except Exception as e:
                        print(e)
                        print("skipping this blacklist file line")
            blacklist_files = set(blacklist_files)
        except OSError as e:
            print(e)
            print("Fall back to no blacklist files")

    supplement_report = None
    if args.supplement_report:
        args.supplement_report = Path(args.supplement_report)
        supplement_report = Table(names=["filename", "basefile", "comment"], dtype=[str, str, str])
        if not args.supplement_report.exists():
            # write the header once, rows are appended at the end of each run
            ascii.write(supplement_report, args.supplement_report, delimiter="\t")

    tempdir = tempfile.TemporaryDirectory()
    tempdir_path = Path(tempdir.name)

    logger.info(f"db_file: {db_file}")
    logger.info(f"include_all_products: {include_all_products}")
    logger.info(f"include_products: {include_products}")
    logger.info(f"include_all_versions: {include_all_versions}")
    logger.info(f"include_versions: {include_versions}")
    logger.info(f"include_levels: {include_levels}")
    logger.info(f"same_esa_name_dir: {same_esa_name_dir}")
    logger.info(f"target_dir: {target_dir}")
    logger.info(f"target_host: {args.target_host}")
    logger.info(f"scp: {scp is not None}")
    logger.info(f"wait_period: {wait_period}")
    logger.info(f"LL wait_period: {LL_wait_period}")
    logger.info(f"fits_dir: {fits_dir}")
    logger.info(f"temp_dir: {tempdir_path}")
    logger.info(f"rid_lut_file: {args.rid_lut_file}")
    logger.info(f"update_rid_lut: {args.update_rid_lut}")
    # fallbacks: reporting the settings must not abort the run on a missing option
    logger.info(f"update_rid_lut_url: {CONFIG.get('Publish', 'rid_lut_file_update_url', fallback=None)}")
    logger.info(f"sort file: {args.sort_files}")
    logger.info(f"blacklist files: {blacklist_files}")
    logger.info(f"supplement report: {args.supplement_report}")
    logger.info(f"batch size: {args.batch_size}")
    logger.info(f"send Mail report: {CONFIG.getboolean('Publish', 'report_mail_send', fallback=False)}")
    logger.info(f"receivers: {CONFIG.get('Publish', 'report_mail_receivers', fallback=None)}")
    logger.info(f"log dir: {args.log_dir}")
    logger.info(f"log level: {args.log_level}")
    logger.info(f"Spice: {spice.meta_kernel_path}")

    logger.info("\nstart publishing\n")
    published = defaultdict(list)

    # first pass: select the files that are due for publishing
    for c in candidates:
        n_candidates += 1
        parts = c.stem.split("_")
        level = parts[1].lower()

        if not include_all_versions:
            # incomplete file names carry a trailing "U" on the version (see add())
            version = int(parts[4].lower().replace("v", "").replace("u", ""))
            if version not in include_versions:
                continue

        last_mod = c.stat().st_ctime

        # should the level by published
        if level not in include_levels:
            continue

        wp_s = LL_wait_period_s if level.startswith("ll") else wait_period_s

        # is the waiting time after last modification done
        if (now - last_mod) < wp_s:
            continue

        if not include_all_products:
            product = str(parts[2].lower().split("-")[1])
            if product not in include_products:
                continue

        old = hist.find_by_name(c.name)

        # was the same file already published
        if len(old) > 0:
            # as the added keyword by publishing will also change the mtime
            # we do not publish again - just with new name (version)
            continue

        if (args.batch_size >= 0) and (len(to_publish) >= args.batch_size):
            logger.info(f"batch size ({args.batch_size}) exceeded > stop looking for more files.")
            break
        to_publish.append(c)

    logger.info(f"#candidates: {n_candidates}")
    logger.info(f"#to_publish: {len(to_publish)}")

    if args.sort_files:
        to_publish = sorted(to_publish)

    # second pass: register each file in the history and deliver it
    for p in to_publish:
        try:
            isFits = p.suffix == ".fits"
            comment = add_BSD_comment(p) if isFits else ""

            if is_incomplete_file_name(p.name):
                p = p.rename(p.parent / get_complete_file_name(p.name))
                if isFits:
                    update_ephemeris_headers(p, spice)

            add_res, data = hist.add(p)
            # id of the history entry of this very file (file names are unique);
            # for naming conflicts data also contains the older entries
            new_entry_id = next((entry["id"] for entry in data if entry["name"] == p.name), None)

            if isFits:
                try:
                    # do not publish products from the future
                    p_header = fits.getheader(p)
                    if "DATE-BEG" in p_header and ":" not in p_header["DATE-BEG"]:
                        p_data_beg = datetime.fromisoformat(p_header["DATE-BEG"])
                    else:
                        p_data_beg = SCETime.from_float(p_header["OBT_BEG"] * u.s).to_datetime()
                    if p_data_beg > next_week:
                        hist.set_result(PublishResult.IGNORED, new_entry_id)
                        published[PublishResult.IGNORED].append(data)
                        continue
                except Exception as e:
                    # best effort check: if no start date can be determined the file is published
                    logger.debug(f"could not check start date of {p.name}: {e}", exc_info=True)

            if p.name in blacklist_files:
                hist.set_result(PublishResult.BLACKLISTED, new_entry_id)
                published[PublishResult.BLACKLISTED].append(data)
            elif add_res == PublishConflicts.ADDED:
                ok, error = copy_file(scp, p, target_dir, add_history_entry=isFits)
                if ok:
                    hist.set_result(PublishResult.PUBLISHED, new_entry_id)
                    published[PublishResult.PUBLISHED].append(data)
                else:
                    hist.set_result(PublishResult.ERROR, new_entry_id)
                    published[PublishResult.ERROR].append((p, error))
            elif add_res == PublishConflicts.SAME_EXISTS:
                # do nothing but add to report
                published[PublishResult.IGNORED].append(data)
            elif add_res == PublishConflicts.SAME_ESA_NAME and isFits:
                # esa naming conflict: compare the data table with all older files
                equal_data_once = False
                for f in data:
                    # do not test against itself
                    if p.name == f["name"]:
                        continue
                    with fits.open(p) as a:
                        with fits.open(Path(f["path"]) / f["name"]) as b:
                            diff = HDUDiff(a["DATA"], b["DATA"], ignore_keywords=["*"])

                            if diff.identical:
                                equal_data_once = True
                                break

                # ignore re-requested data
                if equal_data_once:
                    hist.set_result(PublishResult.IGNORED, new_entry_id)
                    data[-1]["result"] = PublishResult.IGNORED
                    published[PublishResult.IGNORED].append(data)
                else:
                    # cases that covers the same time period but other configurations (pixel sets)

                    sup_nr = len([1 for d in data if d["modified_esaname"]]) + 1

                    # only allow for sup1 and sup2
                    if sup_nr > 2:
                        shutil.copy(p, same_esa_name_dir)
                        hist.set_result(PublishResult.IGNORED, new_entry_id)
                        published[PublishResult.ERROR].append((p, "max supplement error"))
                    else:
                        # the renamed supplement is built in the temp dir, the original stays as is
                        shutil.copy(p, tempdir_path)
                        old_name = p.name
                        name_parts = old_name.split("_")
                        name_parts[2] += f"-sup{sup_nr}"
                        new_name = "_".join(name_parts)

                        os.rename(tempdir_path / old_name, tempdir_path / new_name)
                        parent_comment = (
                            f"supplement data product combine with: {data[0]['name']}"
                            f". Orig filename of this supplement was {old_name}."
                        )
                        fits.setval(tempdir_path / new_name, "COMMENT", value=parent_comment)
                        fits.setval(tempdir_path / new_name, "FILENAME", value=new_name)

                        if args.supplement_report:
                            supplement_report.add_row([new_name, data[0]["name"], comment])

                        ok, error = copy_file(scp, tempdir_path / new_name, target_dir)
                        if ok:
                            hist.set_result(PublishResult.MODIFIED, new_entry_id)
                            data[-1]["result"] = PublishResult.MODIFIED

                            # also set the history entry in the header of the orig file
                            # to the temporary files it was already added by copyFile
                            add_history(p, new_name)

                            modified_esaname = "_".join(name_parts[:-1]) + ".fits"
                            hist.set_modified_esa_name(modified_esaname, new_entry_id)
                            data[-1]["modified_esaname"] = modified_esaname
                            published[PublishResult.MODIFIED].append(data)
                        else:
                            # the error belongs to the new file, not to the first published one
                            hist.set_result(PublishResult.ERROR, new_entry_id)
                            published[PublishResult.ERROR].append((p, error))

            logger.info(f"processed file: {data} > {str(add_res)}")
        except Exception as e:
            published[PublishResult.ERROR].append((p, e))
            logger.error(e, exc_info=True)

    send_mail_report(published)
    if args.supplement_report:
        # append the new report
        with open(args.supplement_report, mode="a") as f:
            f.seek(0, os.SEEK_END)
            supplement_report.write(f, format="ascii.no_header", delimiter="\t")
    hist.close()
    tempdir.cleanup()
    _close_remote()
    return published



def main():
    """Console entry point: run the publish step with the command line arguments."""
    cli_args = sys.argv[1:]
    publish_fits_to_esa(cli_args)


if __name__ == "__main__":
    main()