Context Navigation

← Previous Change
Next Change →

Changeset 135 for trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing

Timestamp:

07/18/16 12:26:03 (9 years ago)

Author:

sherbold

Message:

code documentation and formatting

Location:

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing

Files:

13 edited

CLAMIProcessor.java (modified) (1 diff)
CLAProcessor.java (modified) (1 diff)
LogarithmTransform.java (modified) (1 diff)
MORPH.java (modified) (8 diffs)
MedianAsReference.java (modified) (1 diff)
NominalAttributeFilter.java (modified) (1 diff)
Oversampling.java (modified) (1 diff)
SynonymAttributePruning.java (modified) (2 diffs)
TCAPlusNormalization.java (modified) (2 diffs)
TopMetricFilter.java (modified) (13 diffs)
TransferComponentAnalysis.java (modified) (7 diffs)
Undersampling.java (modified) (1 diff)
ZScoreTargetNormalization.java (modified) (1 diff)

Legend:

(no marker): Unmodified
+: Added
-: Removed

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/CLAMIProcessor.java

-                      r86
+                      r135
     @Override
     public void setParameter(String parameters) {
+        // TODO Auto-generated method stub
+        // dummy, parameters not used
+    }

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/CLAProcessor.java

-                      r86
+                      r135
     @Override
     public void setParameter(String parameters) {
+        // TODO Auto-generated method stub
+        // dummy, parameters not used
+    }

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/LogarithmTransform.java

-                      r86
+                      r135
             Instance instance = traindata.instance(i);
             for (int j = 0; j < testdata.numAttributes(); j++) {
+                if (traindata.attribute(j) != classAttribute && traindata.attribute(j).isNumeric())
+                if (traindata.attribute(j) != classAttribute &&
+                    traindata.attribute(j).isNumeric())
+                {
                     if (instance.value(j) < 0) {

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/MORPH.java

-                      r120
+                      r135
 /**
  * Implements the MORPH data privatization.
+ * Implements the MORPH data privatization.
+ *
+ *
 …
      */
     Random rand = new Random();
     /**
      * parameter alpha for MORPH, default is 0.15
      */
     double alpha = 0.15;
     /**
      * parameter beta for MORPH, default is 0.35
      */
     double beta = 0.35;
     /**
      * Does not have parameters. String is ignored.
 …
         if (parameters != null && !parameters.equals("")) {
             String[] values = parameters.split(" ");
             if( values.length!=2 ) {
+            if (values.length != 2) {
                 throw new InvalidParameterException("MORPH requires two doubles as parameter or no parameters to use default values");
+            }
 …
                 alpha = Double.parseDouble(values[0]);
                 beta = Double.parseDouble(values[1]);
+            } catch(NumberFormatException e) {
+            }
+            catch (NumberFormatException e) {
                 throw new InvalidParameterException("MORPH requires two doubles as parameter or no parameters to use default values");
+            }
 …
     @Override
     public void apply(Instances testdata, SetUniqueList<Instances> traindataSet) {
         for( Instances traindata : traindataSet ) {
+        for (Instances traindata : traindataSet) {
             applyMORPH(traindata);
+        }
 …
         applyMORPH(traindata);
+    }
     /**
+     *
 …
      * </p>
+     *
+     * @param data data to which the processor is applied
+     * @param data
+     *            data to which the processor is applied
      */
     public void applyMORPH(Instances data) {
         for (int i=0; i<data.numInstances(); i++ ) {
+        for (int i = 0; i < data.numInstances(); i++) {
             morphInstance(data.get(i), data);
+        }
+    }
     /**
      * <p>
 …
      * </p>
+     *
+     * @param instance instance that is morphed
+     * @param data data based on which the instance is morphed
+     * @param instance
+     *            instance that is morphed
+     * @param data
+     *            data based on which the instance is morphed
      */
     public void morphInstance(Instance instance, Instances data) {
         Instance nearestUnlikeNeighbor = getNearestUnlikeNeighbor(instance, data);
+        if( nearestUnlikeNeighbor==null ) {
+            throw new RuntimeException("could not find nearest unlike neighbor within the data: " + data.relationName());
+        if (nearestUnlikeNeighbor == null) {
+            throw new RuntimeException("could not find nearest unlike neighbor within the data: " +
+                data.relationName());
+        }
+        for( int j=0; j<data.numAttributes() ; j++ ) {
+            if( data.attribute(j)!=data.classAttribute() && data.attribute(j).isNumeric()) {
+                double randVal = rand.nextDouble()*(beta-alpha)+alpha;
+                instance.setValue(j, instance.value(j) + randVal*(instance.value(j)-nearestUnlikeNeighbor.value(j)) );
+        for (int j = 0; j < data.numAttributes(); j++) {
+            if (data.attribute(j) != data.classAttribute() && data.attribute(j).isNumeric()) {
+                double randVal = rand.nextDouble() * (beta - alpha) + alpha;
+                instance.setValue(j, instance.value(j) +
+                    randVal * (instance.value(j) - nearestUnlikeNeighbor.value(j)));
+            }
+        }
+    }
     /**
      * <p>
      * Determines the nearest unlike neighbor of an instance.
+     * Determines the nearest unlike neighbor of an instance.
      * </p>
+     *
+     * @param instance instance to which the nearest unlike neighbor is determined
+     * @param data data where the nearest unlike neighbor is determined from
+     * @param instance
+     *            instance to which the nearest unlike neighbor is determined
+     * @param data
+     *            data where the nearest unlike neighbor is determined from
      * @return nearest unlike instance
      */
     public Instance getNearestUnlikeNeighbor(Instance instance, Instances data) {
         Instance nearestUnlikeNeighbor = null;
         double[] instanceVector = new double[data.numAttributes()-1];
+        double[] instanceVector = new double[data.numAttributes() - 1];
         int tmp = 0;
         for( int j=0; j<data.numAttributes(); j++ ) {
             if( data.attribute(j)!=data.classAttribute() && data.attribute(j).isNumeric()) {
+        for (int j = 0; j < data.numAttributes(); j++) {
+            if (data.attribute(j) != data.classAttribute() && data.attribute(j).isNumeric()) {
                 instanceVector[tmp] = instance.value(j);
+            }
+        }
         double minDistance = Double.MAX_VALUE;
         for( int i=0 ; i<data.numInstances() ; i++ ) {
             if( instance.classValue() != data.instance(i).classValue() ) {
+        for (int i = 0; i < data.numInstances(); i++) {
+            if (instance.classValue() != data.instance(i).classValue()) {
                 double[] otherVector = new double[data.numAttributes() - 1];
                 tmp = 0;
                 for (int j = 0; j < data.numAttributes(); j++) {
+                    if (data.attribute(j) != data.classAttribute() && data.attribute(j).isNumeric()) {
+                    if (data.attribute(j) != data.classAttribute() &&
+                        data.attribute(j).isNumeric())
+                    {
                         otherVector[tmp++] = data.instance(i).value(j);
+                    }
+                }
                 if( MathArrays.distance(instanceVector, otherVector)<minDistance) {
+                if (MathArrays.distance(instanceVector, otherVector) < minDistance) {
                     minDistance = MathArrays.distance(instanceVector, otherVector);
                     nearestUnlikeNeighbor = data.instance(i);

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/MedianAsReference.java

-                      r86
+                      r135
             Instance instance = traindata.instance(i);
             for (int j = 0; j < traindata.numAttributes(); j++) {
+                if (traindata.attribute(j) != classAttribute && traindata.attribute(j).isNumeric())
+                if (traindata.attribute(j) != classAttribute &&
+                    traindata.attribute(j).isNumeric())
+                {
                     instance.setValue(j, instance.value(j) + (median[j] - currentmedian[j]));

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/NominalAttributeFilter.java

-                      r86
+                      r135
             // delete all instances where nominal attribute has the value of one of the parameter
             if (indexOfnominalAttributeValues.contains(wekaInstance
                 .value(indexOfConfidenceAttribute)))
+            if (indexOfnominalAttributeValues
+                .contains(wekaInstance.value(indexOfConfidenceAttribute)))
+            {
                 traindata.delete(j);

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/Oversampling.java

-                      r86
+                      r135
             Resample resample = new Resample();
-            // TODO: resample.setSampleSizePercent((100.0*counts[1])/100+0.01);
-            // Ohne +0.01 wird bei tomcat, xerces-1.2 und jedit-4.0 ein negative
-            // weniger zurückgegeben
             resample.setSampleSizePercent((100.0 * counts[0]) / counts[1]);
             try {

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/SynonymAttributePruning.java

-                      r86
+                      r135
         double distance;
         for (int j = traindata.numAttributes() - 1; j >= 0; j--) {
             if( j!=traindata.classIndex() ) {
+            if (j != traindata.classIndex()) {
                 boolean hasClosest = false;
                 for (int i1 = 0; !hasClosest && i1 < traindata.size(); i1++) {
 …
                             double distanceJ = Double.MAX_VALUE;
                             for (int k = 0; k < traindata.numAttributes(); k++) {
+                                distance = Math.abs(traindata.get(i1).value(k) - traindata.get(i2).value(k));
+                                distance = Math
+                                    .abs(traindata.get(i1).value(k) - traindata.get(i2).value(k));
                                 if (distance < minVal) {
                                     minVal = distance;

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/TCAPlusNormalization.java

-                      r86
+                      r135
 import weka.core.Instances;
+// normalization selected according to TCA+ rules (TCA has to be applied separately
+/**
+ * <p>
+ * Normalization selected according to the TCA+ rules after Nam et al. (Transfer Defect Learning).
+ * </p>
+ *
+ * @author Steffen Herbold
+ */
 public class TCAPlusNormalization implements IProcessesingStrategy {
 …
     @Override
     public void setParameter(String parameters) {
+        // TODO Auto-generated method stub
+        // dummy, parameters not used
+    }
+    /*
+     * (non-Javadoc)
+     *
+     * @see de.ugoe.cs.cpdp.dataprocessing.IProcessesingStrategy#apply(weka.core.Instances,
+     * weka.core.Instances)
+     */
     @Override
     public void apply(Instances testdata, Instances traindata) {
         applyTCAPlus(testdata, traindata);
+    }
     private void applyTCAPlus(Instances testdata, Instances traindata) {
         DistChar dcTest = WekaUtils.datasetDistance(testdata);
         DistChar dcTrain = WekaUtils.datasetDistance(traindata);
         // RULE 1:
+        if( 0.9*dcTrain.mean<=dcTest.mean && 1.1*dcTrain.mean>=dcTest.mean &&
+                0.9*dcTrain.std<=dcTest.std && 1.1*dcTrain.std>=dcTest.std) {
+        if (0.9 * dcTrain.mean <= dcTest.mean && 1.1 * dcTrain.mean >= dcTest.mean &&
+            0.9 * dcTrain.std <= dcTest.std && 1.1 * dcTrain.std >= dcTest.std)
+        {
             // do nothing
+        }
         // RULE 2:
+        else if((0.4*dcTrain.min>dcTest.min || 1.6*dcTrain.min<dcTest.min) &&
+                (0.4*dcTrain.max>dcTest.max || 1.6*dcTrain.min<dcTest.max) &&
+                (0.4*dcTrain.min>dcTest.num || 1.6*dcTrain.min<dcTest.num)) {
+        else if ((0.4 * dcTrain.min > dcTest.min || 1.6 * dcTrain.min < dcTest.min) &&
+            (0.4 * dcTrain.max > dcTest.max || 1.6 * dcTrain.min < dcTest.max) &&
+            (0.4 * dcTrain.min > dcTest.num || 1.6 * dcTrain.min < dcTest.num))
+        {
             NormalizationUtil.minMax(testdata);
             NormalizationUtil.minMax(traindata);
+        }
         // RULE 3:
+        else if((0.4*dcTrain.std>dcTest.std && dcTrain.num<dcTest.num) ||
+                (1.6*dcTrain.std<dcTest.std)&& dcTrain.num>dcTest.num) {
+        else if ((0.4 * dcTrain.std > dcTest.std && dcTrain.num < dcTest.num) ||
+            (1.6 * dcTrain.std < dcTest.std) && dcTrain.num > dcTest.num)
+        {
             NormalizationUtil.zScoreTraining(testdata, traindata);
+        }
         // RULE 4:
+        else if((0.4*dcTrain.std>dcTest.std && dcTrain.num>dcTest.num) ||
+                (1.6*dcTrain.std<dcTest.std)&& dcTrain.num<dcTest.num) {
+        else if ((0.4 * dcTrain.std > dcTest.std && dcTrain.num > dcTest.num) ||
+            (1.6 * dcTrain.std < dcTest.std) && dcTrain.num < dcTest.num)
+        {
             NormalizationUtil.zScoreTarget(testdata, traindata);
+        }
         //RULE 5:
+        // RULE 5:
         else {
             NormalizationUtil.zScore(testdata);

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/TopMetricFilter.java

-                      r129
+                      r135
      */
     double correlationThreshold = 0.5;
     /*
      * (non-Javadoc)
 …
     @Override
     public void setParameter(String parameters) {
         if( parameters!=null && !parameters.equals("")) {
+        if (parameters != null && !parameters.equals("")) {
             correlationThreshold = Double.parseDouble(parameters);
+        }
 …
+    }
+    private void determineTopKAttributes(Instances testdata, SetUniqueList<Instances> traindataSet) throws Exception {
+        Integer[] counts = new Integer[traindataSet.get(0).numAttributes()-1];
+        IntStream.range(0,counts.length).forEach(val -> counts[val] = 0);
+        for( Instances traindata : traindataSet ) {
+    private void determineTopKAttributes(Instances testdata, SetUniqueList<Instances> traindataSet)
+        throws Exception
+    {
+        Integer[] counts = new Integer[traindataSet.get(0).numAttributes() - 1];
+        IntStream.range(0, counts.length).forEach(val -> counts[val] = 0);
+        for (Instances traindata : traindataSet) {
             J48 decisionTree = new J48();
             decisionTree.buildClassifier(traindata);
             int k=0;
             for( int j=0; j<traindata.numAttributes(); j++) {
                 if(j!=traindata.classIndex()){
                     if( decisionTree.toString().contains(traindata.attribute(j).name()) ) {
                         counts[k] = counts[k]+1;
+            int k = 0;
+            for (int j = 0; j < traindata.numAttributes(); j++) {
+                if (j != traindata.classIndex()) {
+                    if (decisionTree.toString().contains(traindata.attribute(j).name())) {
+                        counts[k] = counts[k] + 1;
+                    }
                     k++;
 …
+        }
         int[] topkIndex = new int[counts.length];
         IntStream.range(0,counts.length).forEach(val -> topkIndex[val] = val);
+        IntStream.range(0, counts.length).forEach(val -> topkIndex[val] = val);
         SortUtils.quicksort(counts, topkIndex, true);
         // get CFSs for each training set
         List<Set<Integer>> cfsSets = new LinkedList<>();
         for( Instances traindata : traindataSet ) {
+        for (Instances traindata : traindataSet) {
             boolean selectionSuccessful = false;
             boolean secondAttempt = false;
 …
                         attsel.SelectAttributes(traindataCopy);
                         Set<Integer> cfsSet = new HashSet<>();
                         for( int attr : attsel.selectedAttributes() ) {
+                        for (int attr : attsel.selectedAttributes()) {
                             cfsSet.add(attr);
+                        }
 …
                         attsel.SelectAttributes(traindata);
                         Set<Integer> cfsSet = new HashSet<>();
                         for( int attr : attsel.selectedAttributes() ) {
+                        for (int attr : attsel.selectedAttributes()) {
                             cfsSet.add(attr);
+                        }
 …
             while (!selectionSuccessful); // dummy loop for internal continue
+        }
         double[] coverages = new double[topkIndex.length];
         for( Set<Integer> cfsSet : cfsSets ) {
+        for (Set<Integer> cfsSet : cfsSets) {
             Set<Integer> topkSet = new HashSet<>();
             for( int k=0; k<topkIndex.length ; k++ ) {
+            for (int k = 0; k < topkIndex.length; k++) {
                 topkSet.add(topkIndex[k]);
                 coverages[k] += (coverage(topkSet, cfsSet)/traindataSet.size());
+                coverages[k] += (coverage(topkSet, cfsSet) / traindataSet.size());
+            }
+        }
         double bestCoverageValue = Double.MIN_VALUE;
         int bestCoverageIndex = 0;
         for( int i=0; i<coverages.length; i++ ) {
             if( coverages[i]>bestCoverageValue) {
+        for (int i = 0; i < coverages.length; i++) {
+            if (coverages[i] > bestCoverageValue) {
                 bestCoverageValue = coverages[i];
                 bestCoverageIndex = i;
 …
         SpearmansCorrelation corr = new SpearmansCorrelation();
         double[][] correlationMatrix = new double[bestCoverageIndex][bestCoverageIndex];
         for( Instances traindata : traindataSet ) {
+        for (Instances traindata : traindataSet) {
             double[][] vectors = new double[bestCoverageIndex][traindata.size()];
             for( int i=0; i<traindata.size(); i++ ) {
                 for( int j=0; j<bestCoverageIndex; j++) {
+            for (int i = 0; i < traindata.size(); i++) {
+                for (int j = 0; j < bestCoverageIndex; j++) {
                     vectors[j][i] = traindata.get(i).value(topkIndex[j]);
+                }
+            }
             for( int j=0; j<bestCoverageIndex; j++ ) {
                 for( int k=j+1; k<bestCoverageIndex; k++ ) {
+            for (int j = 0; j < bestCoverageIndex; j++) {
+                for (int k = j + 1; k < bestCoverageIndex; k++) {
                     correlationMatrix[j][k] = Math.abs(corr.correlation(vectors[j], vectors[k]));
+                }
 …
+        }
         Set<Integer> topkSetIndexSet = new TreeSet<>();
+        // j<30 ensures that the computational time does not explode since the powerset is 2^n in complexity
+        for( int j=0; j<bestCoverageIndex && j<30 ; j++ ) {
+        // j<30 ensures that the computational time does not explode since the powerset is 2^n in
+        // complexity
+        for (int j = 0; j < bestCoverageIndex && j < 30; j++) {
             topkSetIndexSet.add(j);
+        }
 …
         double bestOptCoverage = Double.MIN_VALUE;
         Set<Integer> opttopkSetIndexSet = null;
         for( Set<Integer> combination : allCombinations ) {
             if( isUncorrelated(correlationMatrix, combination) ) {
+        for (Set<Integer> combination : allCombinations) {
+            if (isUncorrelated(correlationMatrix, combination)) {
                 double currentCoverage = 0.0;
                 Set<Integer> topkCombination = new TreeSet<>();
                 for( Integer index : combination ) {
+                for (Integer index : combination) {
                     topkCombination.add(topkIndex[index]);
+                }
                 for( Set<Integer> cfsSet : cfsSets ) {
                     currentCoverage += (coverage(topkCombination, cfsSet)/traindataSet.size());
+                }
                 if( currentCoverage > bestOptCoverage ) {
+                for (Set<Integer> cfsSet : cfsSets) {
+                    currentCoverage += (coverage(topkCombination, cfsSet) / traindataSet.size());
+                }
+                if (currentCoverage > bestOptCoverage) {
                     bestOptCoverage = currentCoverage;
                     opttopkSetIndexSet = combination;
 …
+        }
         Set<Integer> opttopkIndex = new TreeSet<>();
         for( Integer index : opttopkSetIndexSet) {
+        for (Integer index : opttopkSetIndexSet) {
             opttopkIndex.add(topkIndex[index]);
+        }
         Console.traceln(Level.FINE, "selected the following metrics:");
         for( Integer index : opttopkIndex) {
+        for (Integer index : opttopkIndex) {
             Console.traceln(Level.FINE, traindataSet.get(0).attribute(index).name());
+        }
         // finally remove attributes
         for( int j=testdata.numAttributes()-1; j>=0; j-- ) {
             if( j!=testdata.classIndex() && !opttopkIndex.contains(j) ) {
+        for (int j = testdata.numAttributes() - 1; j >= 0; j--) {
+            if (j != testdata.classIndex() && !opttopkIndex.contains(j)) {
                 testdata.deleteAttributeAt(j);
                 for( Instances traindata : traindataSet ) {
+                for (Instances traindata : traindataSet) {
                     traindata.deleteAttributeAt(j);
+                }
 …
+        }
+    }
     private boolean isUncorrelated(double[][] correlationMatrix, Set<Integer> combination) {
         Integer[] intCombination = combination.toArray(new Integer[0]);
         boolean areUncorrelated = true;
+        for( int i=0 ; areUncorrelated && i<intCombination.length ; i++ ) {
+            for( int j=i+1; areUncorrelated && j<intCombination.length ; j++ ) {
+                areUncorrelated &= correlationMatrix[intCombination[i]][intCombination[j]]>correlationThreshold;
+        for (int i = 0; areUncorrelated && i < intCombination.length; i++) {
+            for (int j = i + 1; areUncorrelated && j < intCombination.length; j++) {
+                areUncorrelated &=
+                    correlationMatrix[intCombination[i]][intCombination[j]] > correlationThreshold;
+            }
+        }
         return areUncorrelated;
+    }
     private double coverage(Set<Integer> topkSet, Set<Integer> cfsSet) {
         Set<Integer> topkSetCopy1 = new HashSet<>(topkSet);
 …
         Set<Integer> topkSetCopy2 = new HashSet<>(topkSet);
         topkSetCopy2.addAll(cfsSet);
         return ((double) topkSetCopy1.size())/topkSetCopy2.size();
+        return ((double) topkSetCopy1.size()) / topkSetCopy2.size();
+    }
+}

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/TransferComponentAnalysis.java

-                      r86
+                      r135
  * </p>
+ *
- * TODO comment class
  * @author Steffen Herbold
  */
 public class TransferComponentAnalysis implements IProcessesingStrategy {
+    /**
+     * Dimension of the reduced data.
+     */
     int reducedDimension = 5;
+    /*
+     * (non-Javadoc)
+     *
+     * @see de.ugoe.cs.cpdp.IParameterizable#setParameter(java.lang.String)
+     */
     @Override
     public void setParameter(String parameters) {
+    }
+        // dummy, parameters ignored
+    }
+    /*
+     * (non-Javadoc)
+     *
+     * @see de.ugoe.cs.cpdp.dataprocessing.IProcessesingStrategy#apply(weka.core.Instances,
+     * weka.core.Instances)
+     */
     @Override
     public void apply(Instances testdata, Instances traindata) {
 …
+    }
+    /**
+     * <p>
+     * calculates the linear kernel function between two instances
+     * </p>
+     *
+     * @param x1
+     *            first instance
+     * @param x2
+     *            second instance
+     * @return kernel value
+     */
     private double linearKernel(Instance x1, Instance x2) {
         double value = 0.0d;
 …
+    }
+    /**
+     * <p>
+     * Applies TCA to the test and training data.
+     * </p>
+     *
+     * @param testdata
+     *            the test data
+     * @param traindata
+     *            the training data
+     */
     private void applyTCA(Instances testdata, Instances traindata) {
         final int sizeTest = testdata.numInstances();
 …
+    }
+    /**
+     * <p>
+     * Creates the kernel matrix of the test and training data
+     * </p>
+     *
+     * @param testdata
+     *            the test data
+     * @param traindata
+     *            the training data
+     * @return kernel matrix
+     */
     private PrimitiveMatrix buildKernel(Instances testdata, Instances traindata) {
         final int kernelDim = traindata.numInstances() + testdata.numInstances();
 …
+    }
+    /**
+     * <p>
+     * Calculates the kernel norm matrix, i.e., the matrix which is used for matrix multiplication
+     * to calculate the kernel norm.
+     * </p>
+     *
+     * @param dimTest
+     *            dimension of the test data
+     * @param sizeTrain
+     *            number of instances of the training data
+     * @return kernel norm matrix
+     */
     private PrimitiveMatrix buildKernelNormMatrix(final int dimTest, final int sizeTrain) {
         final double trainSquared = 1.0 / (sizeTrain * (double) sizeTrain);
 …
+    }
+    /**
+     * <p>
+     * Creates the center matrix
+     * </p>
+     *
+     * @param sizeTest
+     *            number of instances of the test data
+     * @param sizeTrain
+     *            number of instances of the training data
+     * @return center matrix
+     */
     private PrimitiveMatrix buildCenterMatrix(final int sizeTest, final int sizeTrain) {
         Builder<PrimitiveMatrix> centerMatrix =
 …
+    }
+    /**
+     * <p>
+     * Builds the mu-Matrix for offsetting values.
+     * </p>
+     *
+     * @param sizeTest
+     *            number of instances of the test data
+     * @param sizeTrain
+     *            number of instances of the training data
+     * @param mu
+     *            mu parameter
+     * @return mu-Matrix
+     */
     private PrimitiveMatrix buildMuMatrix(final int sizeTest,
                                           final int sizeTrain,

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/Undersampling.java

-                      r86
+                      r135
             Resample resample = new Resample();
-            // TODO: resample.setSampleSizePercent((100.0*counts[1])/100+0.01);
-            // Ohne +0.01 wird bei tomcat, xerces-1.2 und jedit-4.0 ein negative weniger
-            // zurückgegeben
             resample.setSampleSizePercent((100.0 * counts[1]) / counts[0]);
             try {

trunk/CrossPare/src/de/ugoe/cs/cpdp/dataprocessing/ZScoreTargetNormalization.java

-                      r86
+                      r135
  * @author Steffen Herbold
  */
+public class ZScoreTargetNormalization implements ISetWiseProcessingStrategy, IProcessesingStrategy
+public class ZScoreTargetNormalization
+    implements ISetWiseProcessingStrategy, IProcessesingStrategy
+{

Note: See TracChangeset for help on using the changeset viewer.

Download in other formats: