Source code for psychopy.data.utils

#!/usr/bin/env python
# -*- coding: utf-8 -*-

# Part of the PsychoPy library
# Copyright (C) 2002-2018 Jonathan Peirce (C) 2019-2025 Open Science Tools Ltd.
# Distributed under the terms of the GNU General Public License (GPL).

import os
import re
import ast
import pickle
import time, datetime
import numpy as np
import pandas as pd

from collections import OrderedDict
from packaging.version import Version

from psychopy import logging, exceptions
from psychopy.tools.filetools import pathToString
from psychopy.localization import _translate

try:
    import openpyxl
    if Version(openpyxl.__version__) >= Version('2.4.0'):
        # openpyxl moved get_column_letter to utils.cell
        from openpyxl.utils.cell import get_column_letter
    else:
        from openpyxl.cell import get_column_letter
    from openpyxl.reader.excel import load_workbook
    haveOpenpyxl = True
except ImportError:
    haveOpenpyxl = False

haveXlrd = False

_nonalphanumeric_re = re.compile(r'\W')  # will match all bad var name chars


def checkValidFilePath(filepath, makeValid=True):
    """Checks whether file path location (e.g. is a valid folder)

    This should also check whether we have write-permissions to the folder
    but doesn't currently do that!

    added in: 1.90.00
    """
    folder = os.path.split(os.path.abspath(filepath))[0]
    if not os.path.isdir(folder):
        os.makedirs(folder)  # spit an error if we fail
    return True


def isValidVariableName(name):
    """Checks whether a certain string could be used as a valid variable.

    Usage::
        OK, msg, translated = isValidVariableName(name)

    >>> isValidVariableName('name')
    (True, '', '')
    >>> isValidVariableName('0name')
    (False, 'Variables cannot begin with numeric character', 'Variabiles non possunt incipere numerorum mores')
    >>> isValidVariableName('first.second')
    (False, 'Variables cannot contain punctuation or spaces', 'Variabiles non habet interpunctionem vel spatia')
    >>> isValidVariableName('first second')
    (False, 'Variables cannot contain punctuation or spaces', 'Variabiles non habet interpunctionem vel spatia')
    >>> isValidVariableName('')
    (False, "Variables cannot be missing, None, or ''", "Variabiles deesse non possunt, nemo, vel ''")
    >>> isValidVariableName(None)
    (False, "Variables cannot be missing, None, or ''", "Variabiles deesse non possunt, nemo, vel ''")
    >>> isValidVariableName(23)
    (False, "Variables must be string-like", "Variabiles debent esse linea-similis")
    >>> isValidVariableName('a_b_c')
    (True, '', '')
    """
    if not name:
        return (
            False,
            "Variables cannot be missing, None, or ''",
            _translate("Variables cannot be missing, None, or ''")
        )
    if not isinstance(name, str):
        return (
            False,
            "Variables must be string-like",
            _translate("Variables must be string-like")
        )
    try:
        name = str(name)  # convert from unicode if possible
    except Exception:
        if type(name) in [str, np.unicode_]:
            raise exceptions.ConditionsImportError(
                "name %s (type %s) contains non-ASCII characters (e.g. accents)" % (name, type(name)),
                translated=_translate("name %s (type %s) contains non-ASCII characters (e.g. accents)") % (name, type(name))
            )
        else:
            raise exceptions.ConditionsImportError(
                "name %s (type %s) could not be converted to a string",
                translated=_translate("name %s (type %s) could not be converted to a string") % (name, type(name))
            )

    if name[0].isdigit():
        return (
            False,
            "Variables cannot begin with numeric character",
            _translate("Variables cannot begin with numeric character")
        )
    if _nonalphanumeric_re.search(name):
        return (
            False,
            "Variables cannot contain punctuation or spaces",
            _translate("Variables cannot contain punctuation or spaces")
        )
    return True, '', ''


def _getExcelCellName(col, row):
    """Returns the excel cell name for a row and column (zero-indexed)

    >>> _getExcelCellName(0,0)
    'A1'
    >>> _getExcelCellName(2,1)
    'C2'
    """
    # BEWARE - openpyxl uses indexing at 1, to fit with Excel
    return "%s%i" % (get_column_letter(col + 1), row + 1)


def importTrialTypes(fileName, returnFieldNames=False):
    """importTrialTypes is DEPRECATED (as of v1.70.00)
    Please use `importConditions` for identical functionality.
    """
    logging.warning("importTrialTypes is DEPRECATED (as of v1.70.00). "
                    "Please use `importConditions` for identical "
                    "functionality.")
    return importConditions(fileName, returnFieldNames)


def sliceFromString(sliceString):
    """Convert a text string into a valid slice object
    which can be used as indices for a list or array.

    >>> sliceFromString("0:10")
    slice(0,10,None)
    >>> sliceFromString("0::3")
    slice(0,None,3)
    >>> sliceFromString("-8:")
    slice(-8,None,None)
    """
    sliceArgs = []
    for val in sliceString.split(':'):
        if len(val) == 0:
            sliceArgs.append(None)
        else:
            sliceArgs.append(int(round(float(val))))
            # nb int(round(float(x))) is needed for x='4.3'
    return slice(*sliceArgs)


def indicesFromString(indsString):
    """Convert a text string into a valid list of indices
    """
    # "6"
    try:
        inds = int(round(float(indsString)))
        return [inds]
    except Exception:
        pass
    # "-6::2"
    try:
        inds = sliceFromString(indsString)
        return inds
    except Exception:
        pass
    # "1,4,8"
    try:
        inds = list(eval(indsString))
        return inds
    except Exception:
        pass


def dictFromString(val):
    # return as-is if already a dict
    if isinstance(val, dict):
        return val
    # stringify
    if not isinstance(val, str):
        val = str(val)
    # strip spaces
    val = val.strip()
    # make sure we have curly braces
    if not val.startswith("{") and val.endswith("}"):
        val = f"{{{val}}}"
    # try to evaluate with ast (works for simple values)
    try:
        iterable = ast.literal_eval(val)
        assert isinstance(iterable, dict)
        return iterable
    except (ValueError, SyntaxError, AssertionError):
        pass  # e.g. "yes, no" won't work. We'll go on and try another way
    # try manually if ast fails
    parsed = {}
    for item in val[1:-1].split(","):
        if ":" in item:
            key, val = item.split(":", maxsplit=1)
            parsed[key.strip()] = val.strip()

    return parsed 


def listFromString(val, excludeEmpties=False):
    """Take a string that looks like a list (with commas and/or [] and make
    an actual python list"""
    # was previously called strToList and str2list might have been an option!
    # I'll leave those here for anyone doing a find-in-path for those
    if type(val) == tuple:
        return list(val)
    elif type(val) == list:
        return list(val)  # nothing to do
    elif type(val) != str:
        return [val]
    # try to evaluate with ast (works for "'yes,'no'" or "['yes', 'no']")
    try:
        iterable = ast.literal_eval(val)
        if type(iterable) == tuple:
            iterable = list(iterable)
        return iterable
    except (ValueError, SyntaxError):
        pass  # e.g. "yes, no" won't work. We'll go on and try another way

    val = val.strip()  # in case there are spaces
    if val.startswith(('[', '(')) and val.endswith((']', ')')):
        val = val[1:-1]
    asList = val.split(",")
    if excludeEmpties:
        asList = [this.strip() for this in asList if this]
    else:
        asList = [this.strip() for this in asList]
    return asList



[docs]
def importConditions(fileName, returnFieldNames=False, selection=""):
    """Imports a list of conditions from an .xlsx, .csv, or .pkl file

    The output is suitable as an input to :class:`TrialHandler`
    `trialList` or to :class:`MultiStairHandler` as a `conditions` list.

    If `fileName` ends with:

    - .csv:  import as a comma-separated-value file
            (header + row x col)
    - .xlsx: import as Excel 2007 (xlsx) files.
            No support for older (.xls) is planned.
    - .pkl:  import from a pickle file as list of lists
            (header + row x col)

    The file should contain one row per type of trial needed and one column
    for each parameter that defines the trial type. The first row should give
    parameter names, which should:

    - be unique
    - begin with a letter (upper or lower case)
    - contain no spaces or other punctuation (underscores are permitted)


    `selection` is used to select a subset of condition indices to be used
    It can be a list/array of indices, a python `slice` object or a string to
    be parsed as either option.
    e.g.:

    - "1,2,4" or [1,2,4] or (1,2,4) are the same
    - "2:5"       # 2, 3, 4 (doesn't include last whole value)
    - "-10:2:"    # tenth from last to the last in steps of 2
    - slice(-10, 2, None)  # the same as above
    - random(5) * 8  # five random vals 0-7

    """

    def _attemptImport(fileName):
        """Attempts to import file with specified settings and raises
        ConditionsImportError if fails due to invalid format

        :param filename: str
        :return: trialList, fieldNames
        """
        if fileName.endswith(('.csv', '.tsv')):
            trialsArr = None
            errs = []
            # list of possible delimiters
            delims = (",", ".", ";", "\t")
            # try a variety of separator / decimal pairs
            for sep, dec in [
                # most common in US, EU
                (',', '.'), 
                (';', ','),
                # other possible formats
                ('\t', '.'), 
                ('\t', ','), 
                (';', '.')
            ]:
                # try to load
                try:
                    thisAttempt = pd.read_csv(
                        fileName, encoding='utf-8-sig', sep=sep, decimal=dec
                    )
                    # read in the headers separately to bypass pandas sanitization
                    thisAttempt.columns = pd.read_csv(
                        fileName, encoding='utf-8-sig', sep=sep, decimal=dec, header=None, nrows=1
                    ).iloc[0, :]
                    # if there's only one header, check that it doesn't contain delimiters
                    # (one column with delims probably means it's parsed without error but not
                    # recognised columns correctly)
                    if len(thisAttempt.columns) == 1:
                        for delim in delims:
                            if delim in thisAttempt.columns[0]:
                                msg = _translate(
                                    "Could not load {}. \n"
                                    "Delimiter in heading: {} in {}."
                                ).format(fileName, delim, thisAttempt.columns[0])
                                err = exceptions.ConditionsImportError(msg)
                                errs.append(err)
                                raise err
                    # if it's all good, use received array
                    trialsArr = thisAttempt
                except Exception:
                    continue
                else:
                    # if successful, check the variable names
                    _assertValidVarNames(trialsArr.columns, fileName)
                    # skip other pairs now we've got it
                    break
            # if all options failed, raise last error
            if errs and trialsArr is None:
                raise errs[-1]
            elif trialsArr is None:
                raise ValueError(
                    _translate("Could not parse file {}.").format(fileName)
                )
            # if we made it herre, we successfully loaded the file
            for col in trialsArr.columns:
                for row, cell in enumerate(trialsArr[col]):
                    if isinstance(cell, str):
                        tryVal = cell.replace(",", ".")
                        try:
                            trialsArr[col][row] = float(tryVal)
                        except ValueError:
                            pass
            logging.debug(u"Read csv file with pandas: {}".format(fileName))
        elif fileName.endswith(('.xlsx', '.xlsm')):
            trialsArr = pd.read_excel(fileName, engine='openpyxl')
            logging.debug(u"Read Excel file with pandas: {}".format(fileName))
        elif fileName.endswith('.xls'):
            trialsArr = pd.read_excel(fileName, engine='xlrd')
            logging.debug(u"Read Excel file with pandas: {}".format(fileName))
        # then try to convert array to trialList and fieldnames
        unnamed = trialsArr.columns.to_series().str.contains('^Unnamed: ')
        trialsArr = trialsArr.loc[:, ~unnamed]  # clear unnamed cols
        logging.debug(u"Clearing unnamed columns from {}".format(fileName))
        trialList, fieldNames = pandasToDictList(trialsArr)

        return trialList, fieldNames

    def _assertValidVarNames(fieldNames, fileName):
        """screens a list of names as candidate variable names. if all
        names are OK, return silently; else raise  with msg
        """
        fileName = pathToString(fileName)
        # make sure all columns are named
        if not all(fieldNames):
            raise exceptions.ConditionsImportError(
                "Conditions file %s: Missing parameter name(s); empty cell(s) in the first row?" % fileName,
                translated=_translate("Conditions file %s: Missing parameter name(s); empty cell(s) in the first row?") % fileName
            )
        # check each name
        for name in fieldNames:
            # is this name duplicated?
            if sum([otherName == name for otherName in fieldNames]) > 1:
                raise exceptions.ConditionsImportError(_translate(
                "Duplicate column name '{}'"
            ).format(name))
            # is this name a valid variable name?
            OK, msg, translated = isValidVariableName(name)
            if not OK:
                # tailor message to importConditions
                msg = msg.replace('Variables', 'Parameters (column headers)')
                translated = msg.replace('Variables', 'Parameters (column headers)')
                raise exceptions.ConditionsImportError(
                    'Bad name: %s%s"%s"' % (name, os.linesep, msg),
                    translated='Bad name: %s%s"%s"' % (name, os.linesep, translated)
                )

    if fileName in ['None', 'none', None]:
        if returnFieldNames:
            return [], []
        return []
    if not os.path.isfile(fileName):
        raise exceptions.ConditionsImportError(
            "Conditions file not found: %s" % fileName,
            translated=_translate("Conditions file not found: %s") % fileName
        )

    def pandasToDictList(dataframe):
        """Convert a pandas dataframe to a list of dicts.
        This helper function is used by csv or excel imports via pandas
        """
        # convert the resulting dataframe to a numpy recarray
        trialsArr = dataframe.to_records(index=False)
        # Check for new line characters in strings, and replace escaped characters
        for record in trialsArr:
            for idx, element in enumerate(record):
                if isinstance(element, str):
                    record[idx] = element.replace('\\n', '\n')
        if trialsArr.shape == ():
            # convert 0-D to 1-D with one element:
            trialsArr = trialsArr[np.newaxis]
        fieldNames = list(trialsArr.dtype.names)
        _assertValidVarNames(fieldNames, fileName)

        # convert the record array into a list of dicts
        trialList = []
        for trialN, trialType in enumerate(trialsArr):
            thisTrial = OrderedDict()
            for fieldN, fieldName in enumerate(fieldNames):
                val = trialsArr[trialN][fieldN]

                if isinstance(val, str):
                    if val.startswith('[') and val.endswith(']'):
                        # val = eval('%s' %unicode(val.decode('utf8')))
                        val = eval(val)
                elif type(val) == np.bytes_:
                    val = str(val.decode('utf-8-sig'))
                    # if it looks like a list, convert it:
                    if val.startswith('[') and val.endswith(']'):
                        # val = eval('%s' %unicode(val.decode('utf8')))
                        val = eval(val)
                elif np.isnan(val):
                    val = None
                thisTrial[fieldName] = val
            trialList.append(thisTrial)
        return trialList, fieldNames

    if (fileName.endswith(('.csv', '.tsv'))
            or (fileName.endswith(('.xlsx', '.xls', '.xlsm')) and haveXlrd)):
        trialList, fieldNames = _attemptImport(fileName=fileName)

    elif fileName.endswith(('.xlsx','.xlsm')):  # no xlsread so use openpyxl
        if not haveOpenpyxl:
            raise exceptions.ConditionsImportError(
                "openpyxl or xlrd is required for loading excel files, but neither was found.",
                _translate("openpyxl or xlrd is required for loading excel files, but neither was found.")
            )

        # data_only was added in 1.8
        if Version(openpyxl.__version__) < Version('1.8'):
            wb = load_workbook(filename=fileName)
        else:
            wb = load_workbook(filename=fileName, data_only=True)
        ws = wb.worksheets[0]

        logging.debug(u"Read excel file with openpyxl: {}".format(fileName))
        try:
            # in new openpyxl (2.3.4+) get_highest_xx is deprecated
            nCols = ws.max_column
            nRows = ws.max_row
        except Exception:
            # version openpyxl 1.5.8 (in Standalone 1.80) needs this
            nCols = ws.get_highest_column()
            nRows = ws.get_highest_row()

        # get parameter names from the first row header
        fieldNames = []
        rangeCols = []
        for colN in range(nCols):
            if Version(openpyxl.__version__) < Version('2.0'):
                fieldName = ws.cell(_getExcelCellName(col=colN, row=0)).value
            else:
                # From 2.0, cells are referenced with 1-indexing: A1 == cell(row=1, column=1)
                fieldName = ws.cell(row=1, column=colN + 1).value
            if fieldName:
                # If column is named, add its name to fieldNames
                fieldNames.append(fieldName)
                rangeCols.append(colN)
        _assertValidVarNames(fieldNames, fileName)

        # loop trialTypes
        trialList = []
        for rowN in range(1, nRows):  # skip header first row
            thisTrial = {}
            for rangeColsIndex, colN in enumerate(rangeCols):
                if Version(openpyxl.__version__) < Version('2.0'):
                    val = ws.cell(_getExcelCellName(col=colN, row=0)).value
                else:
                    # From 2.0, cells are referenced with 1-indexing: A1 == cell(row=1, column=1)
                    val = ws.cell(row=rowN + 1, column=colN + 1).value
                # if it looks like a list or tuple, convert it
                if (isinstance(val, str) and
                        (val.startswith('[') and val.endswith(']') or
                                 val.startswith('(') and val.endswith(')'))):
                    val = eval(val)
                # if it has any line breaks correct them
                if isinstance(val, str):
                    val = val.replace('\\n', '\n')
                # Convert from eu style decimals: replace , with . and try to make it a float
                if isinstance(val, str):
                    tryVal = val.replace(",", ".")
                    try:
                        val = float(tryVal)
                    except ValueError:
                        pass
                fieldName = fieldNames[rangeColsIndex]
                thisTrial[fieldName] = val
            trialList.append(thisTrial)

    elif fileName.endswith('.pkl'):
        f = open(fileName, 'rb')
        # Converting newline characters.
        # 'b' is necessary in Python3 because byte object is
        # returned when file is opened in binary mode.
        buffer = f.read().replace(b'\r\n',b'\n').replace(b'\r',b'\n')
        try:
            trialsArr = pickle.loads(buffer)
        except Exception:
            raise exceptions.ConditionsImportError(
                'Could not open %s as conditions' % fileName,
                translated=_translate('Could not open %s as conditions') % fileName
            )
        f.close()
        trialList = []
        # In Python3, strings returned by pickle() are unhashable so we have to
        # convert them to str.
        trialsArr = [[str(item) if isinstance(item, str) else item
                      for item in row] for row in trialsArr]
        fieldNames = trialsArr[0]  # header line first
        _assertValidVarNames(fieldNames, fileName)
        for row in trialsArr[1:]:
            thisTrial = {}
            for fieldN, fieldName in enumerate(fieldNames):
                # type is correct, being .pkl
                thisTrial[fieldName] = row[fieldN]
            trialList.append(thisTrial)
    else:
        raise exceptions.ConditionsImportError(
            'Your conditions file should be an xlsx, csv, dlm, tsv or pkl file',
            translated=_translate('Your conditions file should be an xlsx, csv, dlm, tsv or pkl file')
        )

    # if we have a selection then try to parse it
    if isinstance(selection, str) and len(selection) > 0:
        selection = indicesFromString(selection)
        if not isinstance(selection, slice):
            for n in selection:
                try:
                    assert n == int(n)
                except AssertionError:
                    raise exceptions.ConditionsImportError(
                        "importConditions() was given some `indices` but could not parse them",
                        translated=_translate("importConditions() was given some `indices` but could not parse them")
                    )

    # the selection might now be a slice or a series of indices
    if isinstance(selection, slice):
        trialList = trialList[selection]
    elif len(selection) > 0:
        allConds = trialList
        trialList = []
        print(selection)
        print(len(allConds))
        for ii in selection:
            trialList.append(allConds[int(ii)])

    logging.exp('Imported %s as conditions, %d conditions, %d params' %
                (fileName, len(trialList), len(fieldNames)))
    if returnFieldNames:
        return (trialList, fieldNames)
    else:
        return trialList



def createFactorialTrialList(factors):
    """Create a trialList by entering a list of factors with names (keys)
    and levels (values) it will return a trialList in which all factors
    have been factorially combined (so for example if there are two factors
    with 3 and 5 levels the trialList will be a list of 3*5 = 15, each
    specifying the values for a given trial

    Usage::

        trialList = createFactorialTrialList(factors)

    :Parameters:

        factors : a dictionary with names (keys) and levels (values) of the
            factors

    Example::

        factors={"text": ["red", "green", "blue"],
                 "letterColor": ["red", "green"],
                 "size": [0, 1]}
        mytrials = createFactorialTrialList(factors)
    """

    # the first step is to place all the factorial combinations in a list of
    # lists
    tempListOfLists = [[]]
    for key in factors:
        # this takes the levels of each factor as a set of values
        # (a list) at a time
        alist = factors[key]
        tempList = []
        for value in alist:
            # now we loop over the values in a given list,
            # and add each value of the other lists
            for iterList in tempListOfLists:
                tempList.append(iterList + [key, value])
        tempListOfLists = tempList

    # this second step is so we can return a list in the format of trialList
    trialList = []
    for atrial in tempListOfLists:
        keys = atrial[0::2]  # the even elements are keys
        values = atrial[1::2]  # the odd elements are values
        atrialDict = {}
        for i in range(len(keys)):
            # this combines the key with the value
            atrialDict[keys[i]] = values[i]
        # append one trial at a time to the final trialList
        trialList.append(atrialDict)

    return trialList



[docs]
def bootStraps(dat, n=1):
    """Create a list of n bootstrapped resamples of the data

    SLOW IMPLEMENTATION (Python for-loop)

    Usage:
        ``out = bootStraps(dat, n=1)``

    Where:
        dat
            an NxM or 1xN array (each row is a different condition, each
            column is a different trial)
        n
            number of bootstrapped resamples to create

        out
            - dim[0]=conditions
            - dim[1]=trials
            - dim[2]=resamples
    """
    dat = np.asarray(dat)
    if len(dat.shape) == 1:
        # have presumably been given a series of data for one stimulus
        # adds a dimension (arraynow has shape (1,Ntrials))
        dat = np.array([dat])

    nTrials = dat.shape[1]
    # initialise a matrix to store output
    resamples = np.zeros(dat.shape + (n,), dat.dtype)
    rand = np.random.rand
    for stimulusN in range(dat.shape[0]):
        thisStim = dat[stimulusN, :]  # fetch data for this stimulus
        for sampleN in range(n):
            indices = np.floor(nTrials * rand(nTrials)).astype('i')
            resamples[stimulusN, :, sampleN] = np.take(thisStim, indices)
    return resamples




[docs]
def functionFromStaircase(intensities, responses, bins=10):
    """Create a psychometric function by binning data from a staircase
    procedure. Although the default is 10 bins Jon now always uses 'unique'
    bins (fewer bins looks pretty but leads to errors in slope estimation)

    usage::

        intensity, meanCorrect, n = functionFromStaircase(intensities,
                                                          responses, bins)

    where:
            intensities
                are a list (or array) of intensities to be binned

            responses
                are a list of 0,1 each corresponding to the equivalent
                intensity value

            bins
                can be an integer (giving that number of bins) or 'unique'
                (each bin is made from aa data for exactly one intensity
                value)

            intensity
                a numpy array of intensity values (where each is the center
                of an intensity bin)

            meanCorrect
                a numpy array of mean % correct in each bin

            n
                a numpy array of number of responses contributing to each mean
    """
    # convert to arrays
    try:
        # concatenate if multidimensional
        intensities = np.concatenate(intensities)
        responses = np.concatenate(responses)
    except Exception:
        intensities = np.array(intensities)
        responses = np.array(responses)

    # sort the responses
    sort_ii = np.argsort(intensities)
    sortedInten = np.take(intensities, sort_ii)
    sortedResp = np.take(responses, sort_ii)

    binnedResp = []
    binnedInten = []
    nPoints = []
    if bins == 'unique':
        intensities = np.round(intensities, decimals=8)
        uniqueIntens = np.unique(intensities)
        for thisInten in uniqueIntens:
            theseResps = responses[intensities == thisInten]
            binnedInten.append(thisInten)
            binnedResp.append(np.mean(theseResps))
            nPoints.append(len(theseResps))
    else:
        pointsPerBin = len(intensities)/bins
        for binN in range(bins):
            start = int(round(binN * pointsPerBin))
            stop = int(round((binN + 1) * pointsPerBin))
            thisResp = sortedResp[start:stop]
            thisInten = sortedInten[start:stop]
            binnedResp.append(np.mean(thisResp))
            binnedInten.append(np.mean(thisInten))
            nPoints.append(len(thisInten))

    return binnedInten, binnedResp, nPoints



def getDateStr(format="%Y-%m-%d_%Hh%M.%S.%f", fractionalSecondDigits=3):
    """Uses ``datetime.now().strftime(format)``_ to generate a string
    based on ISO 8601 but made safe for filename use::

        "2022-01-14_18h35.05.386"

    represents 14th Jan 2022 at 6:35pm with 5 sec and 386 ms

    This is often useful appended to data filenames to provide unique names.

    Parameters
    ----------
    format : str
        See the documentation for `datetime.datetime.strftime` for more
        information on format syntax:
        https://docs.python.org/3/library/datetime.html#strftime-strptime-behavior
        default="%Y-%m-%d_%Hh%M.%S.%f"
    fractionalSecondDigits : int
        An integer value 1-6 indicating the number of digits of fractional
        seconds to include if the `%f` parameter is included in the format.
        This would normally give 6 digits (microseconds) but to get just
        milliseconds you can set fractionalSecondDigits=3

    """
    now = datetime.datetime.now().astimezone()
    microsecs = now.strftime("%f")
    nowStr = now.strftime(format)
    if "%f" in format and (
            fractionalSecondDigits < 1
            or int(fractionalSecondDigits) != fractionalSecondDigits
    ):
        raise TypeError("fractionalSecondDigits argument to getDateStr should "
                        f"be an integer greater than 1, not {fractionalSecondDigits}")
    elif  "%f" in format and fractionalSecondDigits > len(microsecs):
        logging.warning("fractionalSecondDigits argument to getDateStr requested "
                        f"{fractionalSecondDigits} digits but only {len(microsecs)} "
                        f"are available. Truncating to {len(microsecs)}.")
    elif "%f" in format:
        nowStr = nowStr.replace(
            microsecs, microsecs[:int(fractionalSecondDigits)],
        )
    return nowStr


def parsePipeSyntax(key, stripKey=True):
    """
    Parse "pipe syntax" within an expInfo key / all keys in an expInfo dict. Pipe syntax is as follows:

    |req = Required input
    |cfg = Configuration parameter, hidden behind "read more" tag
    |fix = Fixed parameter, meaning its value can't be changed
    |hid = Hidden parameter, meaning it's not down by DlgFromDict

    An unescaped * in the key is considered shorthand for |req.

    Parameters
    ----------
    key : str
        A key to parse.
    stripKey : bool
        If True, trailing spaces will be removed from processed keys. Trailing spaces are removed from flags regardless.

    Returns
    -------
    str
        `value` with pipe syntax removed
    list
        List of flags found
    """
    # add |req if an unescaped * is present
    key = re.sub(r"(?<!\\)\*", "|req", key)
    # get flags
    key, *flags = key.split("|")
    # remove duplicates
    flags = list(set(flags))
    # strip key if requested
    if stripKey:
        key = key.strip()
    # strip each flag
    flags = [flag.strip() for flag in flags]

    return key, flags


def parsePipeSyntaxDict(expInfo, stripKey=True):
    """
    Calls `parsePipeSyntax` on each key in an expInfo dict and returns two new dicts: One with values against sanitized
    keys, the other with flags against processed keys.

    Parameters
    ----------
    expInfo : dict
        Dict whose flags to process
    stripKey : bool
        If True, trailing spaces will be removed from keys. Trailing spaces are removed from flags regardless.

    Returns
    -------
    dict
        The values from `expInfo` with processed keys, i.e. no pipe syntax
    dict
        The flags extraced from processing pipe syntax with processed keys, i.e. no pipe syntax
    """
    valuesDict = {}
    flagsDict = {}
    for key in expInfo:
        # parse key for syntax
        newKey, flags = parsePipeSyntax(key)
        # store original value under parsed key
        valuesDict[newKey] = expInfo[key]
        # store parsed flags under parsed key
        flagsDict[newKey] = flags

    return valuesDict, flagsDict