Currently in Hama, eigenvalue decomposition is not implement.So In STEP 4,
it is hard to migrate it.so I
work out an idea to bypass it. before Step 4, I can let L be
denseMatrix.when I come to Step 4, I can
transform L into submatrix.in Jama,eigenvalue decomposition is support
although it is not parallel computing.So I can get eigValues ,eigVectors
values.But after that in step 5,It need to sort two matrix.
I want to use the hbase sort function.so Hwo can transform this two
submatrix into two densematrix?
or other way ?
/**
* STEP 4
* Calculate the eigen values and vectors of this
covariance matrix
*
* % Get the eigenvectors (columns of Vectors) and
eigenvalues (diag of
Values)
*/
EigenvalueDecomposition eigen = L.eig();
eigValues = eigen.getD();
eigVectors = eigen.getV();
/**
* STEP 5
* % Sort the vectors/values according to size of
eigenvalue
*/
Matrix[] eigDVSorted = sortem(eigValues, eigVectors);
eigValues = eigDVSorted[0];
eigVectors = eigDVSorted[1];
/**
* STEP 6
* % Convert the eigenvectors of A'*A into
eigenvectors of A*A'
*/
eigVectors = A.times(eigVectors);
/**
* STEP 7
* % Get the eigenvalues out of the diagonal
matrix and
* % normalize them so the evalues are
specifically for cov(A'), not
A*A'.
*/
double[] values = diag(eigValues);
for(int i = 0; i < values.length; i++)
values[i] /= A.getColumnDimension() - 1;
/**
* STEP 8
* % Normalize Vectors to unit length, kill
vectors corr. to tiny
evalues
*/
numEigenVecs = 0;
for(int i = 0; i < eigVectors.getColumnDimension(); i++) {
Matrix tmp;
if (values[i] < 0.0001)
{
tmp = new
Matrix(eigVectors.getRowDimension(),1);
}
else
{
tmp =
eigVectors.getMatrix(0,eigVectors.getRowDimension()-1,i,i).times(
1 / eigVectors.getMatrix(0,
eigVectors.getRowDimension() - 1, i,
i).normF());
numEigenVecs++;
}
eigVectors.setMatrix(0,eigVectors.getRowDimension()-1,i,i,tmp);
//eigVectors.timesEquals(1 / eigVectors.getMatrix(0,
eigVectors.getRowDimension() - 1, i, i).normInf());
}
eigVectors =
eigVectors.getMatrix(0,eigVectors.getRowDimension() - 1, 0,
numEigenVecs - 1);
trained = true;
/*System.out.println("There are " + numGood + "
eigenVectors\n\nEigenVectorSize");
System.out.println(eigVectors.getRowDimension());
System.out.println(eigVectors.getColumnDimension());
try {
PrintWriter pw = new PrintWriter("c:\\tmp\\test.txt");
eigVectors.print(pw, 8, 4);
pw.flush();
pw.close();
} catch (Exception e) {
e.printStackTrace();
}
int width = pics[0].img.getWidth(null);
BufferedImage biAvg = imageFromMatrix(bigAvg.getArrayCopy()[0],
width);
try {
saveImage(new File("c:\\tmp\\test.jpg"), biAvg);
} catch (IOException e1) {
e1.printStackTrace();
}*/
}
/**
* Returns a number of eigenFace values to be used in a feature space
* @param pic
* @param number number of eigen feature values.
* @return will be of length number or this.getNumEigenVecs whichever is
the smaller
*/
public double[] getEigenFaces(Picture pic, int number)
{
if (number > numEigenVecs) //adjust the number to
the maxium number of
eigen vectors availiable
number = numEigenVecs;
double[] ret = new double[number];
double[] pixels = pic.getImagePixels();
Matrix face = new Matrix(pixels, pixels.length);
Matrix Vecs =
eigVectors.getMatrix(0,eigVectors.getRowDimension()-1, 0,
number-1).transpose();
Matrix rslt = Vecs.times(face);
for (int i=0; i<number; i++)
{
ret[i] = rslt.get(i,0);
}
return ret;
}
/**
* Gets the diagonal of a matrix
* @param M matrix
* @return
*/
private double[] diag(Matrix M) {
double[] dvec = new double[M.getColumnDimension()];
for(int i = 0; i < M.getColumnDimension(); i++)
dvec[i] = M.get(i, i);
return dvec;
}
/**
* Sorts the Eigenvalues and vectors in decending order
*
* @param D = eigen Values
* @param V = eigen Vectors
* @return
*/
private Matrix[] sortem(Matrix D, Matrix V) {
//dvec = diag(D); // get diagonal components
double[] dvec = diag(D);
//NV = zeros(size(V));
//[dvec,index_dv] = sort(dvec); // sort dvec, maintain index in
index_dv
class di_pair{ double value; int index; };
di_pair[] dvec_indexed = new di_pair[dvec.length];
for(int i = 0; i < dvec_indexed.length; i++) {
dvec_indexed[i] = new di_pair();
dvec_indexed[i].index = i;
dvec_indexed[i].value = dvec[i];
}
Comparator di_pair_sort = new Comparator() {
public int compare(Object arg0, Object arg1) {
di_pair lt = (di_pair)arg0;
di_pair rt = (di_pair)arg1;
double dif = (lt.value - rt.value);
if(dif > 0) return -1;
if(dif < 0) return 1;
else return 0;
}
};
Arrays.sort(dvec_indexed, di_pair_sort);
//index_dv = flipud(index_dv);
//for i = 1:size(D,1)
// ND(i,i) = D(index_dv(i),index_dv(i));
// NV(:,i) = V(:,index_dv(i));
//end;
Matrix D2 = new Matrix(D.getRowDimension(), D.getColumnDimension());
Matrix V2 = new Matrix(V.getRowDimension(), V.getColumnDimension());
for(int i = 0; i < dvec_indexed.length; i++) {
D2.set(i, i, D.get(dvec_indexed[i].index,
dvec_indexed[i].index));
int height = V.getRowDimension() - 1;
Matrix tmp =
V.getMatrix(dvec_indexed[i].index,dvec_indexed[i].index,0,height);
V2.setMatrix(i, i,0,height, tmp);
}
//TODO : Not sure why, but this has to be flipped - check this out
maybe?
Matrix V3 = new Matrix(V.getRowDimension(), V.getColumnDimension());
for (int i=0; i<V3.getRowDimension(); i++)
{
for (int j=0; j< V3.getColumnDimension(); j++)
{
V3.set(i,j,V2.get(V3.getRowDimension() - i - 1,
V3.getColumnDimension() - j - 1));
}
}
return new Matrix[] { D2, V3 };
}
public boolean isTrained() {
return trained;
}
public int getNumEigenVecs() {
return numEigenVecs;
}
}
any advice will be appreciated.thanks in advance.
--
View this message in context:
http://www.nabble.com/Hama--Problem-tp23630187p23666077.html
Sent from the Hadoop core-user mailing list archive at Nabble.com.