Source code for boon.logic

# Boolean Network analysis module
# Author: Franck Delaplace
# Creation date: January 2024

# In comments :
# DEF means definition which is a code part gathering functions related to a process or an object definition,
# STEP means main steps
# WARNING is a warning.

import inspect
import pulp
import sys
import z3
from pulp import PULP_CBC_CMD
from sympy import symbols
from collections.abc import Callable
from sympy.core.symbol import Symbol
from sympy.logic.boolalg import And, Or, Not, Implies, Equivalent, Xor, Xnor, Boolean, BooleanTrue, BooleanFalse
from sympy.logic.boolalg import is_cnf
from tqdm import tqdm

# Dictionary defining the output style of the formula, see prettyform also used for from_textfile and to_textfile.
# The type determines the type of the formula for operators which differ from And, Or, Not.
# let OP be an operator: prefix prints OP( <parameters>), infix prints <p1> OP <p2> ..., and normal form restrict the formula to a normal form and prohibit these operators.
LOGICAL: dict = {'type': 'infix', And: '\u2227', Or: '\u2228', Implies: '\u21D2', Equivalent: '\u21D4', Xor: '\u22BB', Not: '\u00AC', False: 'false', True: 'true'}
MATHEMATICA: dict = {'type': 'prefix', '(': "[", ')': "]",
                     And: '&&', Or: '||', Xor: 'Xor', Xnor: 'Xnor', Implies: 'Implies', Equivalent: 'Equivalent', Not: '!', False: 'False', True: 'True'}
SYMPY: dict = {'type': 'prefix', '(': "(", ')': ")",
               And: '&', Or: '|', Implies: 'Implies', Xor: 'Xor', Xnor: 'Xnor', Equivalent: 'Equivalent', Not: '~', False: 'False', True: 'True'}
JAVA: dict = {'type': 'normal form', And: "&&", Or: "||", Not: "!", False: 'false', True: 'true'}
C: dict = {'type': 'normal form', And: "&&", Or: "||", Not: "!", False: '0', True: '1'}
BOOLNET: dict = {'type': 'normal form', And: "&", Or: "|", Not: "!", False: "0", True: "1"}

SOLVER = PULP_CBC_CMD  # Default PULP solver
PATHSEP: str = "\\"  # Separator in the file path.

prime_implicants_problem = None  # Global variable storing the last prime implicants problem specification.
trc_clauses = 0  # global variables counting the number of CNF clauses in supercnf function
trc_cnf = 0  # global variables counting the number of clauses converted to CNF in supercnf function
nb_implicants = 0  # global variables counting the number of prime implicants in prime_implicants


# DEF: Basic functions

[docs]
def errmsg(msg: str, arg="", kind: str = "ERROR") -> None:
    """
    Display an error message and exit in case of error (kind = "ERROR").

    :param msg: The error message.
    :param arg: The argument of the error message (Default: "" no args).
    :param kind: Type of error (Default: ERROR). Only the "ERROR" option will exit the application.
    :type msg: str
    :type arg: str
    :type kind: str
    :return: None
    :rtype: None
    """

    print(f"** {kind}: {inspect.stack()[1].filename.split(PATHSEP)[-1]} - {inspect.stack()[1].function}: {msg}: {arg}")
    if kind == "ERROR":
        exit()




[docs]
def firstsymbol(formula):
    """ Extract the first symbol from the symbols of a dnf.

    :param formula: The input dnf.
    :type formula: Sympy formula
    :return: the first symbol."""
    if isinstance(formula, bool | BooleanFalse | BooleanTrue):  # The formula is reduced to a Boolean value, no symbols.
        return None
    else:  # The formula has at least 1 symbol.
        return next(iter(formula.free_symbols))



# DEF: Functions decomposing a formula.

[docs]
def cnf2clauses(cnf):
    """ Decomposition of a CNF into a sequence of clauses.

    :param cnf: CNF formula
    :type cnf: sympy formula
    :return: sequence of clauses.
    :rtype: Tuple[formula]"""
    if isinstance(cnf, And):  # The cnf is plain (And of Or-clauses).
        clauses = cnf.args
    elif isinstance(cnf, bool | BooleanFalse | BooleanTrue):  # The cnf is reduced to a boolean value.
        clauses = ()
    else:
        clauses = (cnf,)  # Otherwise, the cnf is reduced to a single clause.
    return clauses




[docs]
def clause2literals(clause) -> set:
    """Convert a clause or a cube into of a sequence of literals.

    :param  clause: The clause or cube.
    :type clause: Sympy formula
    :return: set of literals.
    :rtype: Set"""
    if isinstance(clause, Symbol | Not):  # clause reduced to a single literal.
        literals_clause = {clause}
    elif isinstance(clause, bool | BooleanFalse | BooleanTrue):  # clause reduced to Boolean value.
        literals_clause = set()
    else:  # plain clause.
        literals_clause = set(clause.args)
    return literals_clause



# DEF: Functions converting the formula into another style.

[docs]
def prettyform(formula, style: dict = LOGICAL, depth=0):
    """Return a string of a formula in nice form.

    :param formula: The input formula.
    :param style: The style of the logical operators (Default: LOGICAL)
    :param depth: the current depth of the formula for setting parentheses (Default: 0)
    :type formula: sympy formula
    :type style: dict
    :type depth: int"""
    if isinstance(formula, bool | BooleanFalse | BooleanTrue):
        return style[formula]
    elif isinstance(formula, Symbol):
        return str(formula)
    elif isinstance(formula, Not):
        return style[Not] + prettyform(formula.args[0], style, depth + 1)
    elif isinstance(formula, And | Or):
        new_formula = " {} ".format(style[type(formula)]).join(map(lambda f: prettyform(f, style, depth + 1), formula.args))
        return new_formula if depth == 0 else "(" + new_formula + ")"
    else:  # other operators than Or, And
        try:
            match style['type']:
                case 'infix':
                    new_formula = " {} ".format(style[type(formula)]).join(map(lambda f: prettyform(f, style, depth + 1), formula.args))
                    return new_formula if depth == 0 else "(" + new_formula + ")"
                case 'prefix':
                    return style[type(formula)] + style["("] + ", ".join(map(lambda f: prettyform(f, style, 0), formula.args)) + style[")"]
                case 'normal form':
                    errmsg("Normal form formula only", formula)
                case _:
                    errmsg("Internal program error on style", style['type'])
        except KeyError:
            errmsg(f"Unknown operator of type {type(formula)}", formula)




[docs]
def sympy2z3(formula):
    """Convert a sympy formula to z3 formula.

    :param formula: The formula to convert.
    :type formula: Sympy formula
    :return: the equivalent z3 formula.
    :rtype: Z3 formula"""
    if isinstance(formula, bool):
        return formula
    elif isinstance(formula, BooleanTrue):
        return True
    elif isinstance(formula, BooleanFalse):
        return False
    elif isinstance(formula, Symbol):
        return z3.Bool(formula.name)
    elif isinstance(formula, Not):
        return z3.Not(sympy2z3(formula.args[0]))
    elif isinstance(formula, Or):
        return z3.Or([*map(sympy2z3, formula.args)])
    elif isinstance(formula, And):
        return z3.And([*map(sympy2z3, formula.args)])
    elif isinstance(formula, Implies):
        return z3.Implies(sympy2z3(formula.args[0]), sympy2z3(formula.args[1]))
    elif isinstance(formula, Equivalent):
        return sympy2z3(formula.args[0]) == sympy2z3(formula.args[1])
    else:
        errmsg("a piece of the formula is not recognized", formula)



# DEF: CNF conversion
TEITSIN: str = "_t6n"  # prefix of the new variables introduced in Teitsin conversion
_varcounter = 0  # counter1 used in newvar.



[docs]
def newvar(initialize: int | None = None):
    """Create a new sympy symbol of the form <prefix><number>. The prefix is given by TSEITIN constant.

     :param initialize: Initialize the counter if the value is an integer or let the counter increment by 1 if it is set to None (Default value = None)
     :type  initialize: int|None
     :return: a Simpy symbol.
     :rtype: Symbol"""
    global _varcounter
    if initialize is not None:
        _varcounter = initialize
    else:
        _varcounter = _varcounter + 1
    return symbols("{prefix}{counter:d}".format(prefix=TEITSIN, counter=_varcounter))




[docs]
def tseitin(formula):
    """ Characterize the Tseitin form of a formula.
    TEITSIN constant prefixes the additional variables.

    :param formula: The formula.
    :type formula: Sympy formula
    :return: a pair: Tseitin variable, Tseitin CNF.
    :rtype: Tuple"""
    if isinstance(formula, bool | BooleanFalse | BooleanTrue):
        return formula, True
    elif isinstance(formula, Symbol):
        return formula, True
    elif isinstance(formula, Not):
        # (¬ p ∨ ¬ p1) ∧ (p ∨ p1) ∧ c1
        p = newvar()
        p1, c1 = tseitin(formula.args[0])
        return p, And(Or(Not(p), Not(p1)), Or(p, p1), c1)
    elif isinstance(formula, Or):
        #  p, (¬p ∨ p1 ∨ p2) ∧ (p ∨ ¬p1) ∧ (p ∨ ¬p2) ∧ c1 ∧ c2)
        p = newvar()
        p1, c1 = tseitin(formula.args[0])
        p2, c2 = tseitin(Or(*formula.args[1:]))
        return p, And(Or(Not(p), p1, p2), Or(p, Not(p1)), Or(p, Not(p2)), c1, c2)
    elif isinstance(formula, And):
        # p, (p ∨ ¬p1 ∨ ¬p2) ∧ (¬p ∨ p1) ∧ (¬p ∨ p2) ∧ c1∧ c2
        p = newvar()
        p1, c1 = tseitin(formula.args[0])
        p2, c2 = tseitin(And(*formula.args[1:]))
        return p, And(Or(p, Not(p1), Not(p2)), Or(Not(p), p1), Or(Not(p), p2), c1, c2)
    elif isinstance(formula, Implies):
        # p , (¬p ∨ ¬p1∨ p2) ∧ (p ∨ p1) ∧ (p ∨ ¬p2) ∧ c1∧ c2
        p = newvar()
        p1, c1 = tseitin(formula.args[0])
        p2, c2 = tseitin(formula.args[1])
        return p, And(Or(Not(p), Not(p1), p2), Or(p, p1), Or(p, Not(p2)), c1, c2)
    elif isinstance(formula, Equivalent):
        # p, (¬p ∨¬p1 ∨ p2)∧(¬p ∨ p1 ∨ ¬p2)∧(p ∨ ¬p1 ∨ ¬p2)∧(p ∨ p1 ∨ p2) ∧ c1 ∧ c2)
        p = newvar()
        p1, c1 = tseitin(formula.args[0])
        p2, c2 = tseitin(formula.args[1])
        return p, And(Or(Not(p), Not(p1), p2), Or(Not(p), p1, Not(p2)),
                      Or(p, Not(p1), Not(p2)), Or(p, p1, p2), c1, c2)
    else:
        errmsg("a piece of the formula is not recognized:", formula)
        return symbols("__failed__"), False




[docs]
def tseitin_cnf(formula):
    """Convert a formula to CNF using Tseitin method.

    :param formula: The formula to be converted.
    :type formula: Sympy formula
    :return: CNF formula.
    :rtype: Sympy formula"""
    newvar(0)  # initialize the counter1
    p, f = tseitin(formula)
    return And(p, f)




[docs]
def supercnf(formula, trace: bool = False):
    """ Convert the formula to CNF. The method is well adapted to large formula.

    :param formula: The formula to convert.
    :param trace: Boolean flag if True trace the computational steps (Default value = False)
    :type formula: sympy formula
    :type trace: bool
    :return: CNF formula
    :rtype: sympy formula
    """
    # Most of the classical methods cannot perform the CNF conversion on large formula in acceptable time (cf. to_cnf sympy, pyeda)
    # To overcome this disabling limitation, we design another method based on SAT solver.
    # Basically, let f be a formula, we define the CNF as ¬(SAT(¬f)) as ¬¬f = f, namely the negation of the satisfiable models of ¬f.
    # Let f be a formula, we compute all the models for ¬f. For each datamodel if x = True then return ~x and x if x=False.
    # The SAT solver must necessarily admit non CNF formula and be efficient. We use z3 solver which answers to these requirements.
    # This was really challenging to find an efficient method to convert very large formula in CNF, Yep! I did it :-)
    global trc_clauses
    global trc_cnf
    solver = z3.Solver()  # initialize Z3 solver
    solver.add(sympy2z3(Not(formula)))  # add the negation of the formula.

    # Enumerate all models
    models = []
    trc_clauses = 0
    while solver.check() == z3.sat:
        model = solver.model()
        trc_clauses += 1
        if trace: tqdm.write(f'\rBooN CNF >> # SAT models:[{trc_clauses:5d}]', end='')

        models.append(model)
        # Block the current datamodel to enable the finding of another datamodel.
        block = [sol() != model[sol] for sol in model]
        solver.add(z3.Or(block))  # if x=True, y= False, then add x != True or y != False as constraint disabling the selection of the datamodel.

    # Convert the models into a CNF by negating the datamodel: x=True → ~x, x=False → x
    if trace:
        tqdm.write('')
        cnf = And(*[Or(*map(lambda sol: Not(symbols(str(sol))) if models[trc_cnf][sol] else symbols(str(sol)), models[trc_cnf]))
                    for trc_cnf in tqdm(range(len(models)), file=sys.stdout, ascii=False, desc='BooN CNF >> CNF formatting', ncols=80,
                                        bar_format='{desc}: {percentage:3.0f}% |{bar}[{n_fmt:5s} - {elapsed} - {rate_fmt}]')])
    else:
        cnf = And(*[Or(*map(lambda sol: Not(symbols(str(sol))) if models[trc_cnf][sol] else symbols(str(sol)), models[trc_cnf]))
                    for trc_cnf in range(len(models))])
    return cnf


# DEF:  prime implicants computation.

[docs]
def prime_implicants(formula, kept: Callable = lambda lit: not firstsymbol(lit).name.startswith(TEITSIN), max_solutions:int = sys.maxsize, trace: bool = False, solver: type = SOLVER) -> frozenset:
    """
    Compute all the prime implicants of a propositional formula where the literals are filtered by kept function.

    :param formula: The input formula. The formula does not need to be in CNF.
    :type formula: Sympy formula
    :param kept: Predicate selecting the literals that are kept in the solutions (Default: function discarding the Tseitin working variables)
    :type kept: function
    :param max_solutions: maximal number of solutions (Default sys.maxsize)
    :type max_solutions: int
    :param trace: a Boolean flag determining whether the trace showing the resolution is activated (Default: False).
    :type trace: bool
    :param solver: The solver to use (Default: Pulp solver).
    :type solver: solver function
    :return: all the prime implicants in the form of a set of sets where each subset represents one prime implicant filtered by kept.
    :rtype: frozenset
    """
    global prime_implicants_problem
    global nb_implicants
    # The prime implicants method is based on linear integer programming.
    # The prime implicants are the solutions to solving this integral system.
    # References:
    # Pizzuti, Clara - "Computing prime implicants by integer programming."
    # In: Proceedings Eighth IEEE International Conference on Tools with Artificial Intelligence.
    # IEEE, 1996.
    #
    # Manquinho, V. M., Oliveira, A. L., & Marques-Silva, J. (1998, September).
    # "Models and algorithms for computing minimum-size prime implicants."
    # In Proceedings of the International Workshop on Boolean Problems.

    cnf = formula if is_cnf(formula) else tseitin_cnf(formula)  # Convert the dnf into CNF by the Tseitin method if needed.

    #  Gather all literals from CNF.
    literals = {lit for clause in cnf2clauses(cnf) for lit in clause2literals(clause)}

    # Find the critical variables where a literal and its negation both occur in the CNF formula.
    negvars = {lit for lit in literals if isinstance(lit, Not)}
    posvars = literals - negvars
    negvars = set(map(firstsymbol, negvars))  # Extract the variables from the negative literals.
    criticalvars = posvars & negvars  # Critical variables occurring positively and negatively in the formula.

    # Create a dictionary associating the literals to their Boolean pulp variable of the same name.
    # This dictionary is used to convert the literals into pulp variables (vlit[lit])
    vlit = {lit: pulp.LpVariable(str(lit), lowBound=0, upBound=1, cat=pulp.LpInteger) for lit in literals}

    if trace: tqdm.write("\rBooN PI >> Initialize prime implicants solving.", end="")
    # Initialize the prime implicants problem in pulp.
    primes = pulp.LpProblem("Prime_Implicants", pulp.LpMinimize)
    if trace: tqdm.write("\rBooN PI >> Prime implicants problem initialized.", end="")

    # Objective function = sum of all literals selected by kept function.
    objective_function = pulp.lpSum([vlit[lit] for lit in literals if kept(lit)])
    primes += objective_function

    # Get the sequence of clauses of the CNF.
    clauses = cnf2clauses(cnf)

    # Define the clauses as constraints x |~y | z  --> x + ~y + z >= 1.
    for i, clause in enumerate(clauses):  # Extract the literals of the current clause.
        literals_clause = clause2literals(clause)
        # Transform the current clause into constraints
        primes += pulp.lpSum([vlit[literal] for literal in literals_clause]) >= 1, "CLAUSE_" + str(i)

    # Define the exclusive choice constraint between a variable and its negation for critical variables, i.e., x + ~x <= 1.
    for var in criticalvars:
        primes += vlit[var] + vlit[Not(var)] <= 1, "EXCLUSION_" + var.name.strip()

    if trace: tqdm.write("\rBooN PI >> Solve.                                  ", end="")
    # Find all the solutions until no solutions are found or their number exceeds max_solutions.
    solutions = set()
    status = pulp.LpStatusOptimal
    nb_implicants = 0
    while status == pulp.LpStatusOptimal and nb_implicants < max_solutions :  # while a solution is found

        primes.solve(solver(msg=0))  # Quiet solving
        status = primes.status
        if status == pulp.LpStatusOptimal: # A solution is found then convert it into a set of prime implicants.
            nb_implicants +=1
            if trace: tqdm.write(f'\rBooN PI >> # solutions:[{nb_implicants:3d}]                           ', end='')
            solution = frozenset({lit for lit in literals if kept(lit) and vlit[lit].varValue == 1.})
            solutions.add(solution)

            # Add the constraint discarding the found solution, e.g.  s = {x, ~y, z} -> x+~y+z <= 2 s.t. len(s)-1 = 2.
            discard_solution = pulp.lpSum(map(lambda lit: vlit[lit], solution)) <= len(solution) - 1, "OUT_" + str(nb_implicants)
            primes += discard_solution
    prime_implicants_problem = primes  # keep the specification of the problem in a global variable.
    if trace: tqdm.write('')
    return frozenset(solutions)