forked from KEMT/zpwiki
		
	pagerank
This commit is contained in:
		
							parent
							
								
									4989384544
								
							
						
					
					
						commit
						cfe6e6a52c
					
				
							
								
								
									
										149
									
								
								pages/students/2016/jan_holp/pagerank.js
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										149
									
								
								pages/students/2016/jan_holp/pagerank.js
									
									
									
									
									
										Normal file
									
								
							@ -0,0 +1,149 @@
 | 
				
			|||||||
 | 
					//"use strict";
 | 
				
			||||||
 | 
					// pagerank.js 0.0.1
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//Use a random surfer algorithm to determine the relative 
 | 
				
			||||||
 | 
					//rank of nodes. The importance of each node is determined
 | 
				
			||||||
 | 
					//by the number of incoming links as well as the importance 
 | 
				
			||||||
 | 
					//of those incoming links. 
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// Expose
 | 
				
			||||||
 | 
					// ----------
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//Expose our library to be called externally
 | 
				
			||||||
 | 
					module.exports = function (nodeMatrix, linkProb, tolerance, callback, debug) {
 | 
				
			||||||
 | 
					    if (!nodeMatrix || !linkProb || !tolerance || !callback) {
 | 
				
			||||||
 | 
					        throw new Error("Provide 4 arguments: "+
 | 
				
			||||||
 | 
					            "nodeMatrix, link probability, tolerance, callback");
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    //If debug is unset set it to false
 | 
				
			||||||
 | 
					    if (!debug) { 
 | 
				
			||||||
 | 
					        debug=false;
 | 
				
			||||||
 | 
					    }
 | 
				
			||||||
 | 
					    return new Pagerank(nodeMatrix, linkProb, tolerance, callback, debug);
 | 
				
			||||||
 | 
					};
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					// Initialize
 | 
				
			||||||
 | 
					// ----------
 | 
				
			||||||
 | 
					function Pagerank(nodeMatrix, linkProb, tolerance, callback, debug) {
					    // Builds the ranking state for a graph and immediately starts ranking.
					    //
					    // nodeMatrix: array or plain object; entry k lists the nodes that
					    //             node k links to (its outgoing links).
					    // linkProb:   weight applied to the rank that flows in over links;
					    //             the remaining (1 - linkProb) is shared equally by all
					    //             pages (see coeff below).
					    // tolerance:  a node counts as settled once its new value lies within
					    //             +/- tolerance of its previous value. Smaller values
					    //             demand a tighter fit and therefore more iterations.
					    // callback:   stored here; invoked by iterate() when ranking settles.
					    // debug:      when truthy, reportDebug() is called between iterations.

					    // Array.isArray (rather than instanceof Array) also recognises arrays
					    // created in another realm, e.g. a vm context or an iframe.
					    var isList = Array.isArray(nodeMatrix);

					    this.outgoingNodes = nodeMatrix;
					    this.linkProb = linkProb;
					    this.tolerance = tolerance;
					    this.callback = callback;
					    this.debug = debug;

					    // Number of nodes that have an entry in the outgoing-link table.
					    this.pageCount = Object.keys(nodeMatrix).length;

					    // Constant share every page receives regardless of its inbound links.
					    this.coeff = (1 - linkProb) / this.pageCount;

					    // Both working tables mirror the container type of the input so that
					    // they can be indexed with the same keys.
					    this.probabilityNodes = isList ? [] : {};
					    this.incomingNodes = isList ? [] : {};

					    this.startRanking();
					}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//Start ranking 
 | 
				
			||||||
 | 
					// ----------
 | 
				
			||||||
 | 
					Pagerank.prototype.startRanking = function () {
					    // Seeds every node with the same starting probability, builds the
					    // reverse (incoming-link) table from the outgoing-link table, then
					    // starts the first iteration.
					    var hasOwn = Object.prototype.hasOwnProperty;
					    var initialProbability = 1 / this.pageCount;
					    var outgoingNodes = this.outgoingNodes;
					    // Own keys only: pageCount is derived from Object.keys as well, so the
					    // set of ranked nodes and the convergence check stay consistent even
					    // if the graph object inherits enumerable properties.
					    var sources = Object.keys(outgoingNodes);
					    var s, t, source, links, linkKeys, target;

					    for (s = 0; s < sources.length; s++) {
					        source = sources[s];
					        this.probabilityNodes[source] = initialProbability;

					        // A missing link list is treated as "no outgoing links".
					        links = outgoingNodes[source];
					        linkKeys = (links === null || links === undefined) ? [] : Object.keys(links);

					        for (t = 0; t < linkKeys.length; t++) {
					            target = links[linkKeys[t]];
					            // Own-property test: with a plain-object table, names such as
					            // "constructor" or "toString" would otherwise resolve to
					            // inherited members and the push below would fail.
					            if (!hasOwn.call(this.incomingNodes, target)) {
					                this.incomingNodes[target] = [];
					            }
					            this.incomingNodes[target].push(source);
					        }
					    }

					    // If debug is set, report the initial state as iteration 1.
					    if (this.debug) {
					        this.reportDebug(1);
					    }

					    this.iterate(1);
					};
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//Log iteration to console 
 | 
				
			||||||
 | 
					// ----------
 | 
				
			||||||
 | 
					Pagerank.prototype.reportDebug = function (count) {
					    // Debug hook, called with the iteration number when the debug flag is
					    // set. All logging is currently switched off, so this does nothing
					    // and returns undefined. The state worth printing when it is
					    // re-enabled: count, this.outgoingNodes, this.incomingNodes and
					    // this.probabilityNodes.
					    return;
					};
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					//Calculate new weights 
 | 
				
			||||||
 | 
					// ----------
 | 
				
			||||||
 | 
					Pagerank.prototype.iterate = function (count) {
					    // Repeatedly recomputes every node's probability until, within a
					    // single sweep, every node's new value lies within +/- tolerance of
					    // its previous value. The settled values are then handed to the
					    // callback as callback(null, ranks) and the callback's return value is
					    // returned.
					    //
					    // count: number of the current iteration; only forwarded to
					    //        reportDebug() and incremented after each unsettled sweep.
					    //
					    // ranks is an array (in node order) when the graph was given as an
					    // array, otherwise an object keyed by node name.
					    //
					    // Throws RangeError when the values have not settled after
					    // MAX_ITERATIONS sweeps. The sweeps run in a loop rather than by
					    // recursion, so slowly converging graphs no longer exhaust the call
					    // stack; the cap keeps a non-converging input (e.g. a negative
					    // tolerance) from spinning forever.
					    var MAX_ITERATIONS = 100000;
					    var hasOwn = Object.prototype.hasOwnProperty;
					    var nodes = Object.keys(this.probabilityNodes);
					    var sweep, result, resultHash, n, a, node, incoming, source, sum, res, previous;

					    for (sweep = 0; sweep < MAX_ITERATIONS; sweep++) {
					        result = [];
					        resultHash = {};

					        for (n = 0; n < nodes.length; n++) {
					            node = nodes[n];

					            // Each inbound neighbour contributes its own probability
					            // divided by the number of links it hands out.
					            sum = 0;
					            // Own-property test so that node names such as "constructor"
					            // do not pick up inherited members of a plain-object table.
					            if (hasOwn.call(this.incomingNodes, node)) {
					                incoming = this.incomingNodes[node];
					                for (a = 0; a < incoming.length; a++) {
					                    source = incoming[a];
					                    sum += this.probabilityNodes[source] / this.outgoingNodes[source].length;
					                }
					            }

					            res = this.coeff + this.linkProb * sum;
					            previous = this.probabilityNodes[node];

					            // Record the node as settled when the new value is within
					            // tolerance of the old one.
					            if (previous - this.tolerance <= res && res <= previous + this.tolerance) {
					                resultHash[node] = res;
					                result.push(res);
					            }

					            // Updated in place: nodes later in this sweep already see the
					            // new value.
					            this.probabilityNodes[node] = res;
					        }

					        // Every node settled in this sweep: report the ranks.
					        if (result.length === this.pageCount) {
					            return this.callback(null, Array.isArray(this.outgoingNodes) ? result : resultHash);
					        }

					        // If debug is set, report each unsettled iteration.
					        if (this.debug) {
					            this.reportDebug(count);
					        }
					        ++count;
					    }

					    throw new RangeError("PageRank did not converge within " + MAX_ITERATIONS + " iterations");
					};
 | 
				
			||||||
		Loading…
	
		Reference in New Issue
	
	Block a user