edu.cmu.tetrad.search.Fas Maven / Gradle / Ivy

Show more of this group Show more artifacts with this name
Show all versions of tetrad-lib Show documentation
There is a newer version: 7.6.5
///////////////////////////////////////////////////////////////////////////////
// For information as to what this class does, see the Javadoc, below.       //
// Copyright (C) 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006,       //
// 2007, 2008, 2009, 2010, 2014 by Peter Spirtes, Richard Scheines, Joseph   //
// Ramsey, and Clark Glymour.                                                //
//                                                                           //
// This program is free software; you can redistribute it and/or modify      //
// it under the terms of the GNU General Public License as published by      //
// the Free Software Foundation; either version 2 of the License, or         //
// (at your option) any later version.                                       //
//                                                                           //
// This program is distributed in the hope that it will be useful,           //
// but WITHOUT ANY WARRANTY; without even the implied warranty of            //
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the             //
// GNU General Public License for more details.                              //
//                                                                           //
// You should have received a copy of the GNU General Public License         //
// along with this program; if not, write to the Free Software               //
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA //
///////////////////////////////////////////////////////////////////////////////

package edu.cmu.tetrad.search;

import edu.cmu.tetrad.data.Knowledge;
import edu.cmu.tetrad.graph.*;
import edu.cmu.tetrad.search.test.IndependenceResult;
import edu.cmu.tetrad.search.utils.PcCommon;
import edu.cmu.tetrad.search.utils.SepsetMap;
import edu.cmu.tetrad.util.ChoiceGenerator;
import edu.cmu.tetrad.util.MillisecondTimes;
import edu.cmu.tetrad.util.TetradLogger;

import java.io.PrintStream;
import java.util.*;

/**
 * Implements the Fast Adjacency Search (FAS), which is the adjacency search of the PC algorithm (see). This is a
 * useful algorithm in many contexts, including as the first step of FCI (see).
 *
 * The idea of FAS is that at a given stage of the search, an edge X*-*Y is removed from the
 * graph if X _||_ Y | S, where S is a subset of size d either of adj(X) or of adj(Y), where d is the depth of the
 * search. The fast adjacency search performs this procedure for each pair of adjacent edges in the graph and for each
 * depth d = 0, 1, 2, ..., d1, where d1 is either the maximum depth or else the first such depth at which no edges can
 * be removed. The interpretation of this adjacency search is different for different algorithm, depending on the
 * assumptions of the algorithm. A mapping from {x, y} to S({x, y}) is returned for edges x *-* y that have been
 * removed.
 *
 * FAS may optionally use a heuristic from Causation, Prediction and Search, which (like PC-Stable)
 * renders the output invariant to the order of the input variables.
 *
 * This algorithm was described in the earlier edition of this book:
 *
 * Spirtes, P., Glymour, C. N., Scheines, R., & Heckerman, D. (2000). Causation, prediction, and search. MIT
 * press.
 *
 * This class is configured to respect knowledge of forbidden and required edges, including knowledge of temporal
 * tiers.
 *
 * @author peterspirtes
 * @author clarkglymour
 * @author josephramsey.
 * @see Pc
 * @see Fci
 * @see Knowledge
 */
public class Fas implements IFas {
    private final IndependenceTest test;
    private final TetradLogger logger = TetradLogger.getInstance();
    private Knowledge knowledge = new Knowledge();
    private int numIndependenceTests;
    private SepsetMap sepset = new SepsetMap();
    private PcCommon.PcHeuristicType heuristic = PcCommon.PcHeuristicType.NONE;
    private int depth = 1000;
    private boolean stable = true;
    private long elapsedTime = 0L;
    private PrintStream out = System.out;
    private boolean verbose = false;


    /**
     * Constructor.
     *
     * @param test The test to use for oracle conditional independence test results.
     */
    public Fas(IndependenceTest test) {
        this.test = test;
    }


    /**
     * Runs the search and returns the resulting (undirected) graph.
     *
     * @return This graph.
     */
    @Override
    public Graph search() {
        return search(test.getVariables());
    }

    /**
     * Discovers all adjacencies in data.  The procedure is to remove edges in the graph which connect pairs of
     * variables which are independent, conditional on some other set of variables in the graph (the "sepset"). These are
     * removed in tiers.  First, edges which are independent conditional on zero other variables are removed, then edges
     * which are independent conditional on one other variable are removed, then two, then three, and so on, until no
     * more edges can be removed from the graph.  The edges which remain in the graph after this procedure are the
     * adjacencies in the data.
     *
     * @param nodes A list of nodes to search over.
     * @return An undirected graph that summarizes the conditional independencies that obtain in the data.
     */
    public Graph search(List nodes) {
        long startTime = MillisecondTimes.timeMillis();
        nodes = new ArrayList<>(nodes);

        this.logger.addOutputStream(out);

        if (verbose) {
            this.logger.forceLogMessage("Starting Fast Adjacency Search.");
        }

        this.test.setVerbose(this.verbose);

        int _depth = this.depth;

        if (_depth == -1) {
            _depth = 1000;
        }

        this.sepset = new SepsetMap();

        List edges = new ArrayList<>();
        Map scores = new HashMap<>();

        if (this.heuristic == PcCommon.PcHeuristicType.HEURISTIC_1) {
            Collections.sort(nodes);
        }

        for (int i = 0; i < nodes.size(); i++) {
            for (int j = i + 1; j < nodes.size(); j++) {
                edges.add(Edges.undirectedEdge(nodes.get(i), nodes.get(j)));
            }
        }

        for (Edge edge : edges) {
            IndependenceResult result = this.test.checkIndependence(edge.getNode1(), edge.getNode2(), new HashSet<>());
            scores.put(edge, result.getScore());
        }

        if (this.heuristic == PcCommon.PcHeuristicType.HEURISTIC_2 || this.heuristic == PcCommon.PcHeuristicType.HEURISTIC_3) {
            edges.sort(Comparator.comparing(scores::get));
        }

        Map> adjacencies = new HashMap<>();

        for (Node node : nodes) {
            Set set = new LinkedHashSet<>();

            for (Node _node : nodes) {
                if (_node == node) continue;
                set.add(_node);
            }

            adjacencies.put(node, set);
        }

        for (Edge edge : new ArrayList<>(edges)) {
            if (scores.get(edge) != null && scores.get(edge) < 0
                    || (this.knowledge.isForbidden(edge.getNode1().getName(), edge.getNode2().getName())
                    && (this.knowledge.isForbidden(edge.getNode2().getName(), edge.getNode1().getName())))) {
                edges.remove(edge);
                adjacencies.get(edge.getNode1()).remove(edge.getNode2());
                adjacencies.get(edge.getNode2()).remove(edge.getNode1());
                this.sepset.set(edge.getNode1(), edge.getNode2(), new HashSet<>());
            }
        }

        for (int d = 0; d <= _depth; d++) {
            System.out.println("Depth: " + d);

            boolean more;

            if (this.stable) {
                Map> adjacenciesCopy = new HashMap<>();

                for (Node node : adjacencies.keySet()) {
                    adjacenciesCopy.put(node, new LinkedHashSet<>(adjacencies.get(node)));
                }

                adjacencies = adjacenciesCopy;
            }

            more = searchAtDepth(scores, edges, this.test, adjacencies, d);

            if (!more) {
                break;
            }
        }

        // The search graph. It is assumed going in that all the true adjacencies of x are in this graph for every node
        // x. It is hoped (i.e., true in the large sample limit) that true adjacencies are never removed.
        Graph graph = new EdgeListGraph(nodes);

        for (int i = 0; i < nodes.size(); i++) {
            for (int j = i + 1; j < nodes.size(); j++) {
                Node x = nodes.get(i);
                Node y = nodes.get(j);

                if (adjacencies.get(x).contains(y)) {
                    graph.addUndirectedEdge(x, y);
                }
            }
        }

        if (verbose) {
            this.logger.forceLogMessage("Finishing Fast Adjacency Search.");
        }

        this.elapsedTime = MillisecondTimes.timeMillis() - startTime;

        return graph;
    }

    /**
     * Sets the depth of the search, which is the maximum number of variables that ben be conditioned on in any
     * conditional independence test.
     *
     * @param depth This maximum.
     */
    public void setDepth(int depth) {
        if (depth < -1) {
            throw new IllegalArgumentException(
                    "Depth must be -1 (unlimited) or >= 0.");
        }

        this.depth = depth;
    }

    /**
     * Sets the knowledge to be used in the search.
     *
     * @param knowledge This knowledge.
     * @see Knowledge
     */
    public void setKnowledge(Knowledge knowledge) {
        this.knowledge = new Knowledge(knowledge);
    }

    /**
     * Returns the number of independence tests that were done.
     *
     * @return This number.
     */
    public int getNumIndependenceTests() {
        return this.numIndependenceTests;
    }

    /**
     * Returns the sepsets that were discovered in the search. A 'sepset' for test X _||_ Y | Z1,...,Zm would be
     * {Z1,...,Zm}
     *
     * @return A map of these sepsets indexed by {X, Y}.
     */
    public SepsetMap getSepsets() {
        return this.sepset;
    }

    /**
     * Sets whether verbose output should be printed.
     *
     * @param verbose True iff the case.
     */
    public void setVerbose(boolean verbose) {
        this.verbose = verbose;
    }

    /**
     * Returns the elapsed time of the search.
     *
     * @return This elapsed time.
     */
    public long getElapsedTime() {
        return elapsedTime;
    }

    /**
     * Returns the nodes from the test.
     *
     * @return These nodes.
     */
    @Override
    public List getNodes() {
        return this.test.getVariables();
    }

    /**
     * There are no ambiguous triples for this search, for any nodes.
     *
     * @param node The nodes in question.
     * @return An empty list.
     */
    @Override
    public List getAmbiguousTriples(Node node) {
        return new ArrayList<>();
    }

    /**
     * @param out This print stream.
     */
    @Override
    public void setOut(PrintStream out) {
        this.out = out;
    }

    /**
     * @param pcHeuristic Which PC heuristic to use (see Causation, Prediction and Search). Default is
     *                    PcHeuristicType.NONE.
     * @see PcCommon.PcHeuristicType
     */
    public void setPcHeuristicType(PcCommon.PcHeuristicType pcHeuristic) {
        this.heuristic = pcHeuristic;
    }

    /**
     * Sets whether the stable adjacency search should be used. Default is false. Default is false. See the
     * following reference for this:
     *
     * Colombo, D., & Maathuis, M. H. (2014). Order-independent constraint-based causal structure learning. J. Mach.
     * Learn. Res., 15(1), 3741-3782.
     *
     * @param stable True iff the case.
     */
    public void setStable(boolean stable) {
        this.stable = stable;
    }

    //==============================PRIVATE METHODS======================/

    private int freeDegree(Map> adjacencies) {
        int max = 0;

        for (Node x : adjacencies.keySet()) {
            Set opposites = adjacencies.get(x);

            for (Node y : opposites) {
                Set adjx = new LinkedHashSet<>(opposites);
                adjx.remove(y);

                if (adjx.size() > max) {
                    max = adjx.size();
                }
            }
        }

        return max;
    }

    private boolean searchAtDepth(Map scores, List edges, IndependenceTest test, Map> adjacencies, int depth) {

        for (Edge edge : edges) {
            Node x = edge.getNode1();
            Node y = edge.getNode2();

            if (Thread.currentThread().isInterrupted()) {
                break;
            }

            boolean b = checkSide(scores, test, adjacencies, depth, x, y);
            if (!b) checkSide(scores, test, adjacencies, depth, y, x);
        }

        return freeDegree(adjacencies) > depth;
    }

    private boolean checkSide(Map scores, IndependenceTest test, Map> adjacencies, int depth, Node x, Node y) {
        if (!adjacencies.get(x).contains(y)) return false;

        List _adjx = new ArrayList<>(adjacencies.get(x));
        _adjx.remove(y);

        if (this.heuristic == PcCommon.PcHeuristicType.HEURISTIC_1 || this.heuristic == PcCommon.PcHeuristicType.HEURISTIC_2) {
            Collections.sort(_adjx);
        }

        List ppx = possibleParents(x, _adjx, this.knowledge, y);

        Map scores2 = new HashMap<>();

        for (Node node : ppx) {
            Double _score = scores.get(Edges.undirectedEdge(node, x));
            scores2.put(node, _score);
        }

        if (this.heuristic == PcCommon.PcHeuristicType.HEURISTIC_3) {
            ppx.sort(Comparator.comparing(scores2::get));
            Collections.reverse(ppx);
        }

        if (ppx.size() >= depth) {
            ChoiceGenerator cg = new ChoiceGenerator(ppx.size(), depth);
            int[] choice;

            while ((choice = cg.next()) != null) {
                if (Thread.currentThread().isInterrupted()) {
                    break;
                }

                Set Z = GraphUtils.asSet(choice, ppx);

                this.numIndependenceTests++;

                boolean independent = test.checkIndependence(x, y, Z).isIndependent();

                boolean noEdgeRequired = this.knowledge.noEdgeRequired(x.getName(), y.getName());

                if (independent && noEdgeRequired) {
                    adjacencies.get(x).remove(y);
                    adjacencies.get(y).remove(x);

                    getSepsets().set(x, y, Z);

                    return true;
                }
            }
        }

        return false;
    }

    private List possibleParents(Node x, List adjx,
                                       Knowledge knowledge, Node y) {
        List possibleParents = new LinkedList<>();
        String _x = x.getName();

        for (Node z : adjx) {
            if (z == x) continue;
            if (z == y) continue;
            String _z = z.getName();

            if (possibleParentOf(_z, _x, knowledge)) {
                possibleParents.add(z);
            }
        }

        return possibleParents;
    }

    private boolean possibleParentOf(String z, String x, Knowledge knowledge) {
        return !knowledge.isForbidden(z, x) && !knowledge.isRequired(x, z);
    }
}