// Origin: apache/incubator-retired-mrql, commit 1b271526e4d275a80ef3abc6d53d756802f9f428, queries/factorization2.mrql

// Matrix factorization using functions (slower than factorization.mrql).

// Build the matrices first using the build_matrix.mrql query.

// Input matrices, each bound to a binary data source on disk.
// The files must already exist before this query is run.
// Note the naming: Mmatrix/Hmatrix/Wmatrix are read from the X/Y/Z files.
Mmatrix = source(binary,"tmp/Xmatrix.bin");   // matrix to be factorized
Hmatrix = source(binary,"tmp/Ymatrix.bin");   // initial value for H
Wmatrix = source(binary,"tmp/Zmatrix.bin");   // initial value for W

// A matrix is a collection of (value, index, index) triples, one per stored cell.
// The functions in this file treat the second component as the row index and
// the third as the column index.
// NOTE(review): the leading '!' presumably marks a persistent (distributed) bag -- confirm
// against the MRQL language description.
type matrix = !{(double,long,long)};

// matrix transposition:
// every cell (x,i,j) of X is emitted as (x,j,i), i.e. the two index
// components are swapped and the value is left unchanged.
function transpose ( X: matrix ): matrix {
   select (x,j,i)
     from (x,i,j) in X
};

// matrix multiplication:
// pairs each cell (x,i,k) of X with each cell (y,k,j) of Y that shares the
// inner index k, forms the product z = x*y, and sums the products that fall
// into the same output position (i,j).
// Output positions are produced only for (i,j) groups that have at least
// one matching pair of cells.
function multiply ( X: matrix, Y: matrix ): matrix {
   select (sum(z),i,j)
     from (x,i,k) in X, (y,k,j) in Y, z = x*y
    group by (i,j)
};

// cell-wise multiplication:
// pairs the cell (x,i,j) of X with the cell (y,i,j) of Y at the same
// position and emits (x*y, i, j).
// NOTE(review): a position stored in only one of the two inputs presumably
// yields no output cell (join on the repeated variables i, j) -- confirm.
function Cmult ( X: matrix, Y: matrix ): matrix {
   select ( x*y, i, j )
     from (x,i,j) in X, (y,i,j) in Y
};

// cell-wise division:
// pairs the cell (x,i,j) of X with the cell (y,i,j) of Y at the same
// position and emits (x/y, i, j).
// There is no guard for y = 0; the result of such a division is whatever
// double division produces.
function Cdiv ( X: matrix, Y: matrix ): matrix {
   select ( x/y, i, j )
     from (x,i,j) in X, (y,i,j) in Y
};

// Gaussian non-negative matrix factorization (from SystemML paper)
//
//   V      the matrix to factorize
//   Hinit  starting value for H
//   Winit  starting value for W
//
// Starting from (H,W) = (Hinit,Winit), each step replaces the pair with
//   H' = H .* ( (W^T V) ./ (W^T (W H)) )
//   W' = W .* ( (V H^T) ./ (W (H H^T)) )
// where .* and ./ are the cell-wise Cmult and Cdiv. Both components of the
// step are written in terms of the H and W bound by the repeat pattern, so
// the W update uses the H of the previous iteration, not the new H'.
// The iteration is bounded by "limit 4"; the result is the pair of matrices
// in (H,W) order.
function factorize ( V: matrix, Hinit: matrix, Winit: matrix ): (matrix,matrix) {
   repeat (H,W) = (Hinit,Winit)
     step ( Cmult(H,Cdiv(multiply(transpose(W),V),multiply(transpose(W),multiply(W,H)))),
            Cmult(W,Cdiv(multiply(V,transpose(H)),multiply(W,multiply(H,transpose(H))))) )
    limit 4
};

// Run the factorization: Mmatrix is the matrix to factorize, Hmatrix and
// Wmatrix are the initial H and W.
factorize(Mmatrix,Hmatrix,Wmatrix);