This repository has been archived on 2023-08-20. You can view files and clone it, but cannot push or open issues or pull requests.
yap-6.3/packages/CLPBN/horus/FactorGraph.cpp

457 lines
11 KiB
C++
Raw Normal View History

2012-05-23 14:56:01 +01:00
#include <set>
#include <vector>
#include <algorithm>
#include <iostream>
#include <fstream>
#include <sstream>
#include "FactorGraph.h"
#include "Factor.h"
#include "BayesNet.h"
#include "BayesBall.h"
#include "Util.h"
// Copy constructor: rebuilds the nodes and edges of `fg` inside this graph.
// Every variable node and factor node is freshly allocated with `new`, so
// the copy does not share node objects with `fg`.
FactorGraph::FactorGraph (const FactorGraph& fg)
{
  // Clone the variable nodes first: the edges created below look the
  // clones up in varNodes_ by the index of the corresponding source node.
  for (auto* srcVar : fg.varNodes()) {
    addVarNode (new VarNode (srcVar));
  }
  // Clone each factor node and reconnect it to the cloned variables.
  for (auto* srcFac : fg.facNodes()) {
    FacNode* clone = new FacNode (srcFac->factor());
    addFacNode (clone);
    for (auto* srcNeigh : srcFac->neighbors()) {
      addEdge (varNodes_[srcNeigh->getIndex()], clone);
    }
  }
  bayesFactors_ = fg.bayesianFactors();
}
void
FactorGraph::readFromUaiFormat (const char* fileName)
{
std::ifstream is (fileName);
if (!is.is_open()) {
cerr << "error: cannot read from file " << fileName << endl;
abort();
}
ignoreLines (is);
string line;
getline (is, line);
if (line != "MARKOV") {
cerr << "error: the network must be a MARKOV network " << endl;
abort();
}
// read the number of vars
ignoreLines (is);
unsigned nrVars;
is >> nrVars;
// read the range of each var
ignoreLines (is);
Ranges ranges (nrVars);
for (unsigned i = 0; i < nrVars; i++) {
is >> ranges[i];
}
unsigned nrFactors;
unsigned nrArgs;
unsigned vid;
is >> nrFactors;
vector<VarIds> factorVarIds;
vector<Ranges> factorRanges;
for (unsigned i = 0; i < nrFactors; i++) {
ignoreLines (is);
is >> nrArgs;
factorVarIds.push_back ({ });
factorRanges.push_back ({ });
for (unsigned j = 0; j < nrArgs; j++) {
is >> vid;
if (vid >= ranges.size()) {
cerr << "error: invalid variable identifier `" << vid << "'" << endl;
cerr << "identifiers must be between 0 and " << ranges.size() - 1 ;
cerr << endl;
abort();
}
factorVarIds.back().push_back (vid);
factorRanges.back().push_back (ranges[vid]);
}
}
// read the parameters
unsigned nrParams;
for (unsigned i = 0; i < nrFactors; i++) {
ignoreLines (is);
is >> nrParams;
2012-05-24 16:14:13 +01:00
if (nrParams != Util::sizeExpected (factorRanges[i])) {
2012-05-23 14:56:01 +01:00
cerr << "error: invalid number of parameters for factor nº " << i ;
2012-05-24 16:14:13 +01:00
cerr << ", expected: " << Util::sizeExpected (factorRanges[i]);
2012-05-23 14:56:01 +01:00
cerr << ", given: " << nrParams << endl;
abort();
}
Params params (nrParams);
for (unsigned j = 0; j < nrParams; j++) {
is >> params[j];
}
if (Globals::logDomain) {
2012-05-24 16:14:13 +01:00
Util::log (params);
2012-05-23 14:56:01 +01:00
}
addFactor (Factor (factorVarIds[i], factorRanges[i], params));
}
is.close();
}
void
FactorGraph::readFromLibDaiFormat (const char* fileName)
{
std::ifstream is (fileName);
if (!is.is_open()) {
cerr << "error: cannot read from file " << fileName << endl;
abort();
}
ignoreLines (is);
unsigned nrFactors;
unsigned nrArgs;
VarId vid;
is >> nrFactors;
for (unsigned i = 0; i < nrFactors; i++) {
ignoreLines (is);
// read the factor arguments
is >> nrArgs;
VarIds vids;
for (unsigned j = 0; j < nrArgs; j++) {
ignoreLines (is);
is >> vid;
vids.push_back (vid);
}
// read ranges
Ranges ranges (nrArgs);
for (unsigned j = 0; j < nrArgs; j++) {
ignoreLines (is);
is >> ranges[j];
VarNode* var = getVarNode (vids[j]);
if (var != 0 && ranges[j] != var->range()) {
cerr << "error: variable `" << vids[j] << "' appears in two or " ;
cerr << "more factors with a different range" << endl;
}
}
// read parameters
ignoreLines (is);
unsigned nNonzeros;
is >> nNonzeros;
2012-05-24 16:14:13 +01:00
Params params (Util::sizeExpected (ranges), 0);
2012-05-23 14:56:01 +01:00
for (unsigned j = 0; j < nNonzeros; j++) {
ignoreLines (is);
unsigned index;
is >> index;
ignoreLines (is);
double val;
is >> val;
params[index] = val;
}
if (Globals::logDomain) {
2012-05-24 16:14:13 +01:00
Util::log (params);
2012-05-23 14:56:01 +01:00
}
2012-05-28 14:42:20 +01:00
std::reverse (vids.begin(), vids.end());
2012-05-23 14:56:01 +01:00
Factor f (vids, ranges, params);
2012-05-28 14:42:20 +01:00
std::reverse (vids.begin(), vids.end());
2012-05-23 14:56:01 +01:00
f.reorderArguments (vids);
addFactor (f);
}
is.close();
}
// Destructor: deletes every variable node and every factor node stored
// in this graph.
FactorGraph::~FactorGraph (void)
{
  for (auto* varNode : varNodes_) {
    delete varNode;
  }
  for (auto* facNode : facNodes_) {
    delete facNode;
  }
}
void
FactorGraph::addFactor (const Factor& factor)
{
FacNode* fn = new FacNode (factor);
addFacNode (fn);
const VarIds& vids = fn->factor().arguments();
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < vids.size(); i++) {
2012-05-23 14:56:01 +01:00
VarMap::const_iterator it = varMap_.find (vids[i]);
if (it != varMap_.end()) {
addEdge (it->second, fn);
} else {
VarNode* vn = new VarNode (vids[i], fn->factor().range (i));
addVarNode (vn);
addEdge (vn, fn);
}
}
}
// Registers the variable node `vn`: appends it to varNodes_, stores its
// position in that container as the node's index and records it in
// varMap_ under its variable identifier.
void
FactorGraph::addVarNode (VarNode* vn)
{
  // The index is the position the node occupies once appended.
  vn->setIndex (varNodes_.size());
  varNodes_.push_back (vn);
  varMap_.insert (make_pair (vn->varId(), vn));
}
// Registers the factor node `fn`: appends it to facNodes_ and stores its
// position in that container as the node's index.
void
FactorGraph::addFacNode (FacNode* fn)
{
  // The index is the position the node occupies once appended.
  fn->setIndex (facNodes_.size());
  facNodes_.push_back (fn);
}
// Connects the variable node `vn` and the factor node `fn` by adding
// each one to the neighbor list of the other.
void
FactorGraph::addEdge (VarNode* vn, FacNode* fn)
{
  fn->addNeighbor (vn);
  vn->addNeighbor (fn);
}
// Returns true when the graph has no cycle. Only acyclicity is tested
// here; connectivity is not checked.
bool
FactorGraph::isTree (void) const
{
  const bool cyclic = containsCycle();
  return !cyclic;
}
// Returns the directed graph associated with this factor graph, building
// it on the first call (i.e. while structure_ is still empty).
//
// One DAGraphNode is created per variable node and, for every factor, an
// edge is added from each argument after the first one to the first
// argument. Asserts that bayesFactors_ is set.
DAGraph&
FactorGraph::getStructure (void)
{
  assert (bayesFactors_);
  if (!structure_.empty()) {
    return structure_;  // already built by a previous call
  }
  for (auto* varNode : varNodes_) {
    structure_.addNode (new DAGraphNode (varNode));
  }
  for (auto* facNode : facNodes_) {
    const VarIds& args = facNode->factor().arguments();
    for (size_t k = 1; k < args.size(); k++) {
      structure_.addEdge (args[k], args[0]);
    }
  }
  return structure_;
}
void
FactorGraph::print (void) const
{
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < varNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
cout << "var id = " << varNodes_[i]->varId() << endl;
cout << "label = " << varNodes_[i]->label() << endl;
cout << "range = " << varNodes_[i]->range() << endl;
cout << "evidence = " << varNodes_[i]->getEvidence() << endl;
cout << "factors = " ;
2012-05-24 22:55:20 +01:00
for (size_t j = 0; j < varNodes_[i]->neighbors().size(); j++) {
2012-05-23 14:56:01 +01:00
cout << varNodes_[i]->neighbors()[j]->getLabel() << " " ;
}
cout << endl << endl;
}
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < facNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
facNodes_[i]->factor().print();
}
}
void
FactorGraph::exportToGraphViz (const char* fileName) const
{
ofstream out (fileName);
if (!out.is_open()) {
cerr << "error: cannot open file to write at " ;
cerr << "FactorGraph::exportToDotFile()" << endl;
abort();
}
out << "graph \"" << fileName << "\" {" << endl;
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < varNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
if (varNodes_[i]->hasEvidence()) {
out << '"' << varNodes_[i]->label() << '"' ;
out << " [style=filled, fillcolor=yellow]" << endl;
}
}
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < facNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
out << '"' << facNodes_[i]->getLabel() << '"' ;
out << " [label=\"" << facNodes_[i]->getLabel();
out << "\"" << ", shape=box]" << endl;
}
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < facNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
const VarNodes& myVars = facNodes_[i]->neighbors();
2012-05-24 22:55:20 +01:00
for (size_t j = 0; j < myVars.size(); j++) {
2012-05-23 14:56:01 +01:00
out << '"' << facNodes_[i]->getLabel() << '"' ;
out << " -- " ;
out << '"' << myVars[j]->label() << '"' << endl;
}
}
out << "}" << endl;
out.close();
}
void
FactorGraph::exportToUaiFormat (const char* fileName) const
{
ofstream out (fileName);
if (!out.is_open()) {
cerr << "error: cannot open file " << fileName << endl;
abort();
}
out << "MARKOV" << endl;
out << varNodes_.size() << endl;
2012-05-28 17:00:46 +01:00
VarNodes sortedVns = varNodes_;
std::sort (sortedVns.begin(), sortedVns.end(), sortByVarId());
for (size_t i = 0; i < sortedVns.size(); i++) {
out << ((i != 0) ? " " : "") << sortedVns[i]->range();
2012-05-23 14:56:01 +01:00
}
2012-05-28 17:00:46 +01:00
out << endl << facNodes_.size() << endl;
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < facNodes_.size(); i++) {
2012-05-28 17:00:46 +01:00
VarIds args = facNodes_[i]->factor().arguments();
out << args.size() << " " << Util::elementsToString (args) << endl;
2012-05-23 14:56:01 +01:00
}
2012-05-28 17:00:46 +01:00
out << endl;
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < facNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
Params params = facNodes_[i]->factor().params();
if (Globals::logDomain) {
2012-05-24 16:14:13 +01:00
Util::exp (params);
2012-05-23 14:56:01 +01:00
}
2012-05-28 17:00:46 +01:00
out << params.size() << endl << " " ;
out << Util::elementsToString (params) << endl << endl;
2012-05-23 14:56:01 +01:00
}
out.close();
}
void
FactorGraph::exportToLibDaiFormat (const char* fileName) const
{
ofstream out (fileName);
if (!out.is_open()) {
cerr << "error: cannot open file " << fileName << endl;
abort();
}
out << facNodes_.size() << endl << endl;
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < facNodes_.size(); i++) {
2012-05-28 14:42:20 +01:00
Factor f (facNodes_[i]->factor());
out << f.nrArguments() << endl;
2012-05-28 17:00:46 +01:00
out << Util::elementsToString (f.arguments()) << endl;
out << Util::elementsToString (f.ranges()) << endl;
2012-05-28 14:42:20 +01:00
VarIds args = f.arguments();
std::reverse (args.begin(), args.end());
f.reorderArguments (args);
2012-05-23 14:56:01 +01:00
if (Globals::logDomain) {
2012-05-28 14:42:20 +01:00
Util::exp (f.params());
2012-05-23 14:56:01 +01:00
}
2012-05-28 14:42:20 +01:00
out << f.size() << endl;
for (size_t j = 0; j < f.size(); j++) {
out << j << " " << f[j] << endl;
2012-05-23 14:56:01 +01:00
}
out << endl;
}
out.close();
}
void
FactorGraph::ignoreLines (std::ifstream& is) const
{
string ignoreStr;
while (is.peek() == '#' || is.peek() == '\n') {
getline (is, ignoreStr);
}
}
bool
FactorGraph::containsCycle (void) const
{
vector<bool> visitedVars (varNodes_.size(), false);
vector<bool> visitedFactors (facNodes_.size(), false);
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < varNodes_.size(); i++) {
2012-05-23 14:56:01 +01:00
int v = varNodes_[i]->getIndex();
if (!visitedVars[v]) {
if (containsCycle (varNodes_[i], 0, visitedVars, visitedFactors)) {
return true;
}
}
}
return false;
}
bool
FactorGraph::containsCycle (
const VarNode* v,
const FacNode* p,
vector<bool>& visitedVars,
vector<bool>& visitedFactors) const
{
visitedVars[v->getIndex()] = true;
const FacNodes& adjacencies = v->neighbors();
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < adjacencies.size(); i++) {
2012-05-23 14:56:01 +01:00
int w = adjacencies[i]->getIndex();
if (!visitedFactors[w]) {
if (containsCycle (adjacencies[i], v, visitedVars, visitedFactors)) {
return true;
}
}
else if (visitedFactors[w] && adjacencies[i] != p) {
return true;
}
}
return false; // no cycle detected in this component
}
bool
FactorGraph::containsCycle (
const FacNode* v,
const VarNode* p,
vector<bool>& visitedVars,
vector<bool>& visitedFactors) const
{
visitedFactors[v->getIndex()] = true;
const VarNodes& adjacencies = v->neighbors();
2012-05-24 22:55:20 +01:00
for (size_t i = 0; i < adjacencies.size(); i++) {
2012-05-23 14:56:01 +01:00
int w = adjacencies[i]->getIndex();
if (!visitedVars[w]) {
if (containsCycle (adjacencies[i], v, visitedVars, visitedFactors)) {
return true;
}
}
else if (visitedVars[w] && adjacencies[i] != p) {
return true;
}
}
return false; // no cycle detected in this component
}