Marked the backwards compatibility edge interface of BipartiteGraph as obsolete
[libdai.git] / include / dai / bipgraph.h
1 /* Copyright (C) 2006-2008 Joris Mooij [joris dot mooij at tuebingen dot mpg dot de]
2 Radboud University Nijmegen, The Netherlands /
3 Max Planck Institute for Biological Cybernetics, Germany
4
5 This file is part of libDAI.
6
7 libDAI is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2 of the License, or
10 (at your option) any later version.
11
12 libDAI is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
16
17 You should have received a copy of the GNU General Public License
18 along with libDAI; if not, write to the Free Software
19 Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22
23 /// \file
24 /// \brief Defines BipartiteGraph class
25
26
27 #ifndef __defined_libdai_bipgraph_h
28 #define __defined_libdai_bipgraph_h
29
30
#include <algorithm>
#include <cassert>
#include <iostream>
#include <ostream>
#include <utility>
#include <vector>
#include <dai/util.h>
36
37
38 namespace dai {
39
40
/// Represents the neighborhood structure of nodes in a bipartite graph.
/** A bipartite graph has two types of nodes: type 1 and type 2. Edges can occur only between
 *  nodes of different type. Nodes are indexed by an unsigned integer. If there are nr1()
 *  nodes of type 1 and nr2() nodes of type 2, the nodes of type 1 are numbered
 *  0,1,2,...,nr1()-1 and the nodes of type 2 are numbered 0,1,2,...,nr2()-1. An edge
 *  between node \a n1 of type 1 and node \a n2 of type 2 is represented by a BipartiteGraph::Edge(\a n1,\a n2).
 *
 *  A BipartiteGraph is implemented as a sparse adjacency list, i.e., it stores for each node a list of
 *  its neighboring nodes. In particular, it stores for each node of type 1 a vector of Neighbor structures
 *  (accessible by the nb1() method) describing the neighboring nodes of type 2; similarly, for each node
 *  of type 2 it stores a vector of Neighbor structures (accessible by the nb2() method) describing the
 *  neighboring nodes of type 1.
 *  Thus, each node has an associated variable of type BipartiteGraph::Neighbors, which is a vector of
 *  Neighbor structures, describing its neighboring nodes of the other type.
 *  \idea Cache second-order neighborhoods in BipartiteGraph.
 */
57 class BipartiteGraph {
58 public:
59 /// Describes the neighbor relationship of two nodes in a BipartiteGraph.
60 /** Sometimes we want to do an action, such as sending a
61 * message, for all edges in a graph. However, most graphs
62 * will be sparse, so we need some way of storing a set of
63 * the neighbors of a node, which is both fast and
64 * memory-efficient. We also need to be able to go between
65 * viewing node \a A as a neighbor of node \a B, and node \a
66 * B as a neighbor of node \a A. The Neighbor struct solves
67 * both of these problems. Each node has a list of neighbors,
68 * stored as a vector<Neighbor>, and extra information is
69 * included in the Neighbor struct which allows us to access
70 * a node as a neighbor of its neighbor (the \a dual member).
71 *
72 * By convention, variable identifiers naming indices into a
73 * vector of neighbors are prefixed with an underscore ("_").
74 * The neighbor list which they point into is then understood
75 * from context. For example:
76 *
77 * \code
78 * void BP::calcNewMessage( size_t i, size_t _I )
79 * \endcode
80 *
81 * Here, \a i is the "absolute" index of node i, but \a _I is
82 * understood as a "relative" index, giving node I's entry in
83 * nb1(i). The corresponding Neighbor structure can be
84 * accessed as nb1(i,_I) or nb1(i)[_I]. The absolute index of
85 * \a _I, which would be called \a I, can be recovered from
86 * the \a node member: nb1(i,_I).node. The \a iter member
87 * gives the relative index \a _I, and the \a dual member
88 * gives the "dual" relative index, i.e. the index of \a i in
89 * \a I's neighbor list.
90 *
91 * \code
92 * Neighbor n = nb1(i,_I);
93 * n.node == I &&
94 * n.iter == _I &&
95 * nb2(n.node,n.dual).node == i
96 * \endcode
97 *
98 * In a FactorGraph, nb1 is called nbV, and nb2 is called
99 * nbF.
100 *
101 * There is no easy way to transform a pair of absolute node
102 * indices \a i and \a I into a Neighbor structure relative
103 * to one of the nodes. Such a feature has never yet been
104 * found to be necessary. Iteration over edges can always be
105 * accomplished using the Neighbor lists, and by writing
106 * functions that accept relative indices:
107 * \code
108 * for( size_t i = 0; i < nrVars(); ++i )
109 * foreach( const Neighbor &I, nbV(i) )
110 * calcNewMessage( i, I.iter );
111 * \endcode
112 */
113 struct Neighbor {
114 /// Corresponds to the index of this Neighbor entry in the vector of neighbors
115 size_t iter;
116 /// Contains the number of the neighboring node
117 size_t node;
118 /// Contains the "dual" iter
119 size_t dual;
120
121 /// Default constructor
122 Neighbor() {}
123 /// Constructor that sets the Neighbor members according to the parameters
124 Neighbor( size_t iter, size_t node, size_t dual ) : iter(iter), node(node), dual(dual) {}
125
126 /// Cast to size_t returns node member
127 operator size_t () const { return node; }
128 };
129
130 /// Describes the neighbors of some node.
131 typedef std::vector<Neighbor> Neighbors;
132
133 /// Represents an edge: an Edge(\a n1,\a n2) corresponds to the edge between node \a n1 of type 1 and node \a n2 of type 2.
134 typedef std::pair<size_t,size_t> Edge;
135
136 private:
137 /// Contains for each node of type 1 a vector of its neighbors
138 std::vector<Neighbors> _nb1;
139
140 /// Contains for each node of type 2 a vector of its neighbors
141 std::vector<Neighbors> _nb2;
142
143 /// Used internally by isTree()
144 struct levelType {
145 std::vector<size_t> ind1; // indices of nodes of type 1
146 std::vector<size_t> ind2; // indices of nodes of type 2
147 };
148
149 /// @name Backwards compatibility layer (to be removed soon)
150 //@{
151 /// Enable backwards compatibility layer?
152 bool _edge_indexed;
153 /// Call indexEdges() first to initialize these members
154 std::vector<Edge> _edges;
155 /// Call indexEdges() first to initialize these members
156 hash_map<Edge,size_t> _vv2e;
157 //}@
158
159 public:
160 /// Default constructor (creates an empty bipartite graph)
161 BipartiteGraph() : _nb1(), _nb2(), _edge_indexed(false) {}
162
163 /// Constructs BipartiteGraph from a range of edges.
164 /** \tparam EdgeInputIterator Iterator that iterates over instances of BipartiteGraph::Edge.
165 * \param nr1 The number of nodes of type 1.
166 * \param nr2 The number of nodes of type 2.
167 * \param begin Points to the first edge.
168 * \param end Points just beyond the last edge.
169 */
170 template<typename EdgeInputIterator>
171 BipartiteGraph( size_t nr1, size_t nr2, EdgeInputIterator begin, EdgeInputIterator end ) : _nb1( nr1 ), _nb2( nr2 ), _edge_indexed(false) {
172 construct( nr1, nr2, begin, end );
173 }
174
175 /// (Re)constructs BipartiteGraph from a range of edges.
176 /** \tparam EdgeInputIterator Iterator that iterates over instances of BipartiteGraph::Edge.
177 * \param nr1 The number of nodes of type 1.
178 * \param nr2 The number of nodes of type 2.
179 * \param begin Points to the first edge.
180 * \param end Points just beyond the last edge.
181 */
182 template<typename EdgeInputIterator>
183 void construct( size_t nr1, size_t nr2, EdgeInputIterator begin, EdgeInputIterator end );
184
185 /// Returns constant reference to the _i2'th neighbor of node i1 of type 1
186 const Neighbor & nb1( size_t i1, size_t _i2 ) const {
187 #ifdef DAI_DEBUG
188 assert( i1 < _nb1.size() );
189 assert( _i2 < _nb1[i1].size() );
190 #endif
191 return _nb1[i1][_i2];
192 }
193 /// Returns reference to the _i2'th neighbor of node i1 of type 1
194 Neighbor & nb1( size_t i1, size_t _i2 ) {
195 #ifdef DAI_DEBUG
196 assert( i1 < _nb1.size() );
197 assert( _i2 < _nb1[i1].size() );
198 #endif
199 return _nb1[i1][_i2];
200 }
201
202 /// Returns constant reference to the _i1'th neighbor of node i2 of type 2
203 const Neighbor & nb2( size_t i2, size_t _i1 ) const {
204 #ifdef DAI_DEBUG
205 assert( i2 < _nb2.size() );
206 assert( _i1 < _nb2[i2].size() );
207 #endif
208 return _nb2[i2][_i1];
209 }
210 /// Returns reference to the _i1'th neighbor of node i2 of type 2
211 Neighbor & nb2( size_t i2, size_t _i1 ) {
212 #ifdef DAI_DEBUG
213 assert( i2 < _nb2.size() );
214 assert( _i1 < _nb2[i2].size() );
215 #endif
216 return _nb2[i2][_i1];
217 }
218
219 /// Returns constant reference to all neighbors of node i1 of type 1
220 const Neighbors & nb1( size_t i1 ) const {
221 #ifdef DAI_DEBUG
222 assert( i1 < _nb1.size() );
223 #endif
224 return _nb1[i1];
225 }
226 /// Returns reference to all neighbors of node of i1 type 1
227 Neighbors & nb1( size_t i1 ) {
228 #ifdef DAI_DEBUG
229 assert( i1 < _nb1.size() );
230 #endif
231 return _nb1[i1];
232 }
233
234 /// Returns constant reference to all neighbors of node i2 of type 2
235 const Neighbors & nb2( size_t i2 ) const {
236 #ifdef DAI_DEBUG
237 assert( i2 < _nb2.size() );
238 #endif
239 return _nb2[i2];
240 }
241 /// Returns reference to all neighbors of node i2 of type 2
242 Neighbors & nb2( size_t i2 ) {
243 #ifdef DAI_DEBUG
244 assert( i2 < _nb2.size() );
245 #endif
246 return _nb2[i2];
247 }
248
249 /// Returns number of nodes of type 1
250 size_t nr1() const { return _nb1.size(); }
251 /// Returns number of nodes of type 2
252 size_t nr2() const { return _nb2.size(); }
253
254 /// Calculates the number of edges, time complexity: O(nr1())
255 size_t nrEdges() const {
256 size_t sum = 0;
257 for( size_t i1 = 0; i1 < nr1(); i1++ )
258 sum += nb1(i1).size();
259 return sum;
260 }
261
262 /// Adds a node of type 1 without neighbors.
263 void add1() { _nb1.push_back( Neighbors() ); }
264
265 /// Adds a node of type 2 without neighbors.
266 void add2() { _nb2.push_back( Neighbors() ); }
267
268 /// Adds a node of type 1, with neighbors specified by a range of nodes of type 2.
269 /** \tparam NodeInputIterator Iterator that iterates over instances of size_t.
270 * \param begin Points to the first index of the nodes of type 2 that should become neighbors of the added node.
271 * \param end Points just beyond the last index of the nodes of type 2 that should become neighbors of the added node.
272 * \param sizeHint For improved efficiency, the size of the range may be specified by sizeHint.
273 */
274 template <typename NodeInputIterator>
275 void add1( NodeInputIterator begin, NodeInputIterator end, size_t sizeHint = 0 ) {
276 Neighbors nbs1new;
277 nbs1new.reserve( sizeHint );
278 size_t iter = 0;
279 for( NodeInputIterator it = begin; it != end; ++it ) {
280 assert( *it < nr2() );
281 Neighbor nb1new( iter, *it, nb2(*it).size() );
282 Neighbor nb2new( nb2(*it).size(), nr1(), iter++ );
283 nbs1new.push_back( nb1new );
284 nb2( *it ).push_back( nb2new );
285 }
286 _nb1.push_back( nbs1new );
287 }
288
289 /// Adds a node of type 2, with neighbors specified by a range of nodes of type 1.
290 /** \tparam NodeInputIterator Iterator that iterates over instances of size_t.
291 * \param begin Points to the first index of the nodes of type 1 that should become neighbors of the added node.
292 * \param end Points just beyond the last index of the nodes of type 1 that should become neighbors of the added node.
293 * \param sizeHint For improved efficiency, the size of the range may be specified by sizeHint.
294 */
295 template <typename NodeInputIterator>
296 void add2( NodeInputIterator begin, NodeInputIterator end, size_t sizeHint = 0 ) {
297 Neighbors nbs2new;
298 nbs2new.reserve( sizeHint );
299 size_t iter = 0;
300 for( NodeInputIterator it = begin; it != end; ++it ) {
301 assert( *it < nr1() );
302 Neighbor nb2new( iter, *it, nb1(*it).size() );
303 Neighbor nb1new( nb1(*it).size(), nr2(), iter++ );
304 nbs2new.push_back( nb2new );
305 nb1( *it ).push_back( nb1new );
306 }
307 _nb2.push_back( nbs2new );
308 }
309
310 /// Removes node n1 of type 1 and all incident edges.
311 void erase1( size_t n1 );
312
313 /// Removes node n2 of type 2 and all incident edges.
314 void erase2( size_t n2 );
315
316 /// Adds an edge between node n1 of type 1 and node n2 of type 2.
317 /** If check == true, only adds the edge if it does not exist already.
318 */
319 void addEdge( size_t n1, size_t n2, bool check = true ) {
320 assert( n1 < nr1() );
321 assert( n2 < nr2() );
322 bool exists = false;
323 if( check ) {
324 // Check whether the edge already exists
325 foreach( const Neighbor &nb2, nb1(n1) )
326 if( nb2 == n2 ) {
327 exists = true;
328 break;
329 }
330 }
331 if( !exists ) { // Add edge
332 Neighbor nb_1( _nb1[n1].size(), n2, _nb2[n2].size() );
333 Neighbor nb_2( nb_1.dual, n1, nb_1.iter );
334 _nb1[n1].push_back( nb_1 );
335 _nb2[n2].push_back( nb_2 );
336 }
337 }
338
339 /// Calculates second-order neighbors (i.e., neighbors of neighbors) of node n1 of type 1.
340 /** If include == true, includes n1 itself, otherwise excludes n1.
341 */
342 std::vector<size_t> delta1( size_t n1, bool include = false ) const;
343
344 /// Calculates second-order neighbors (i.e., neighbors of neighbors) of node n2 of type 2.
345 /** If include == true, includes n2 itself, otherwise excludes n2.
346 */
347 std::vector<size_t> delta2( size_t n2, bool include = false ) const;
348
349 /// Returns true if the graph is connected
350 /** \todo Should be optimized by invoking boost::graph library
351 */
352 bool isConnected() const;
353
354 /// Returns true if the graph is a tree, i.e., if it is singly connected and connected.
355 bool isTree() const;
356
357 /// Writes this BipartiteGraph to an output stream in GraphViz .dot syntax
358 void printDot( std::ostream& os ) const;
359
360 /// @name Backwards compatibility layer (to be removed soon)
361 //@{
362 void indexEdges() {
363 std::cerr << "Warning: this BipartiteGraph edge interface is obsolete!" << std::endl;
364 _edges.clear();
365 _vv2e.clear();
366 size_t i=0;
367 foreach(const Neighbors &nb1s, _nb1) {
368 foreach(const Neighbor &n2, nb1s) {
369 Edge e(i, n2.node);
370 _edges.push_back(e);
371 }
372 i++;
373 }
374 sort(_edges.begin(), _edges.end()); // unnecessary?
375
376 i=0;
377 foreach(const Edge& e, _edges) {
378 _vv2e[e] = i++;
379 }
380
381 _edge_indexed = true;
382 }
383
384 const Edge& edge(size_t e) const {
385 assert(_edge_indexed);
386 return _edges[e];
387 }
388
389 const std::vector<Edge>& edges() const {
390 return _edges;
391 }
392
393 size_t VV2E(size_t n1, size_t n2) const {
394 assert(_edge_indexed);
395 Edge e(n1,n2);
396 hash_map<Edge,size_t>::const_iterator i = _vv2e.find(e);
397 assert(i != _vv2e.end());
398 return i->second;
399 }
400
401 size_t nr_edges() const {
402 assert(_edge_indexed);
403 return _edges.size();
404 }
405 //}@
406
407 private:
408 /// Checks internal consistency
409 void check() const;
410 };
411
412
413 template<typename EdgeInputIterator>
414 void BipartiteGraph::construct( size_t nr1, size_t nr2, EdgeInputIterator begin, EdgeInputIterator end ) {
415 _nb1.clear();
416 _nb1.resize( nr1 );
417 _nb2.clear();
418 _nb2.resize( nr2 );
419
420 for( EdgeInputIterator e = begin; e != end; e++ ) {
421 #ifdef DAI_DEBUG
422 addEdge( e->first, e->second, true );
423 #else
424 addEdge( e->first, e->second, false );
425 #endif
426 }
427 }
428
429
430 } // end of namespace dai
431
432
433 /** \example example_bipgraph.cpp
434 * This example deals with the following bipartite graph:
435 * \dot
436 * graph example {
437 * ordering=out;
438 * subgraph cluster_type1 {
439 * node[shape=circle,width=0.4,fixedsize=true,style=filled];
440 * 12 [label="2"];
441 * 11 [label="1"];
442 * 10 [label="0"];
443 * }
444 * subgraph cluster_type2 {
445 * node[shape=polygon,regular=true,sides=4,width=0.4,fixedsize=true,style=filled];
446 * 21 [label="1"];
447 * 20 [label="0"];
448 * }
449 * 10 -- 20;
450 * 11 -- 20;
451 * 12 -- 20;
452 * 11 -- 21;
453 * 12 -- 21;
454 * }
455 * \enddot
456 * It has three nodes of type 1 (drawn as circles) and two nodes of type 2 (drawn as rectangles).
457 * Node 0 of type 1 has only one neighbor (node 0 of type 2), but node 0 of type 2 has three neighbors (nodes 0,1,2 of type 1).
458 * The example code shows how to construct a BipartiteGraph object representing this bipartite graph and
459 * how to iterate over nodes and their neighbors.
460 *
461 * \section Output
462 * \verbinclude examples/example_bipgraph.out
463 *
464 * \section Source
465 */
466
467
468 #endif