HBPMedical
diff --git a/‎.circleci/config.yml‎
Lines changed: 8 additions & 8 deletions b/‎.circleci/config.yml‎
Lines changed: 8 additions & 8 deletions
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 0 deletions b/‎.gitignore‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎build.sh‎
Lines changed: 1 addition & 1 deletion b/‎build.sh‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎java-jsi-clus-rm/.bumpversion.cfg‎
Lines changed: 12 additions & 0 deletions b/‎java-jsi-clus-rm/.bumpversion.cfg‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎java-jsi-clus-rm/.dockerignore‎
Lines changed: 8 additions & 0 deletions b/‎java-jsi-clus-rm/.dockerignore‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎java-jsi-clus-rm/.gitignore‎
Lines changed: 4 additions & 0 deletions b/‎java-jsi-clus-rm/.gitignore‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎java-jsi-clus-rm/Dockerfile‎
Lines changed: 50 additions & 0 deletions b/‎java-jsi-clus-rm/Dockerfile‎
Lines changed: 50 additions & 0 deletions
diff --git a/‎java-jsi-clus-rm/README.md‎
Lines changed: 42 additions & 0 deletions b/‎java-jsi-clus-rm/README.md‎
Lines changed: 42 additions & 0 deletions
diff --git a/‎java-jsi-clus-rm/build.sh‎
Lines changed: 32 additions & 0 deletions b/‎java-jsi-clus-rm/build.sh‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎java-jsi-clus-rm/captain.yml‎
Lines changed: 7 additions & 0 deletions b/‎java-jsi-clus-rm/captain.yml‎
Lines changed: 7 additions & 0 deletions
@@ -150,14 +150,14 @@ jobs:
           name: "Test java-jsi-clus-fr"
           command: |
             PATH=$PATH:/$HOME/.captain/bin/ ./java-jsi-clus-fr/tests/test.sh
-     # - run:
-     #     name: "Build java-jsi-clus-rm"
-     #     command: |
-     #       PATH=$PATH:/$HOME/.captain/bin/ ./java-jsi-clus-rm/build.sh
-     # - run:
-     #     name: "Test java-jsi-clus-rm"
-     #     command: |
-     #       PATH=$PATH:/$HOME/.captain/bin/ ./java-jsi-clus-rm/tests/test.sh
+      - run:
+          name: "Build java-jsi-clus-rm"
+          command: |
+            PATH=$PATH:/$HOME/.captain/bin/ ./java-jsi-clus-rm/build.sh
+      - run:
+          name: "Test java-jsi-clus-rm"
+          command: |
+            PATH=$PATH:/$HOME/.captain/bin/ ./java-jsi-clus-rm/tests/test.sh
       - run:
           name: "Build python-jsi-hedwig"
           command: |
 
@@ -9,3 +9,5 @@ algorithm-repository.Rproj
 **/.Rhistory
 *.orig
 .Rproj.user
+/.metadata/
+/.recommenders/
@@ -22,7 +22,7 @@ else
   DOCKER="sudo docker"
 fi
 
-IMAGES="r-summary-stats r-linear-regression java-rapidminer java-jsi-clus-pct java-jsi-clus-pct-ts java-jsi-clus-fire java-jsi-clus-fr python-jsi-hedwig python-jsi-hinmine"
+IMAGES="r-summary-stats r-linear-regression java-rapidminer java-jsi-clus-pct java-jsi-clus-rm java-jsi-clus-pct-ts java-jsi-clus-fire java-jsi-clus-fr python-jsi-hedwig python-jsi-hinmine"
 
 commit_id="$(git rev-parse --short HEAD)"
 
 
@@ -0,0 +1,12 @@
+[bumpversion]
+current_version = 0.0.1
+commit = True
+tag = True
+tag_name = java-jsi-clus-rm-{new_version}
+parse = (?P<major>\d+)\.(?P<minor>\d+)\.(?P<patch>\d+)
+serialize = {major}.{minor}.{patch}
+
+[bumpversion:file:pom.xml]
+search = <version>{current_version}</version><!-- bumpversion -->
+replace = <version>{new_version}</version><!-- bumpversion -->
+
@@ -0,0 +1,8 @@
+.git/
+.idea/
+target/
+*~
+.settings
+.project
+deps/rm/
+deps/decompiled/
@@ -0,0 +1,4 @@
+target/
+.classpath
+.settings
+.project
@@ -0,0 +1,50 @@
+FROM hbpmip/java-base-build:3.5.2-jdk-8-0 AS build-java-env
+# Build stage: resolve the Maven dependencies, then package the jar and generate the site.
+COPY pom.xml /project/pom.xml
+COPY src/ /project/src
+COPY deps/ /project/deps
+
+RUN cp /usr/share/maven/ref/settings-docker.xml /root/.m2/settings.xml \
+    && mvn dependency:go-offline
+
+# settings.xml is copied again on purpose: the original author found the build works better this way (presumably /root/.m2 is a VOLUME in the base image, so the earlier copy is not kept - TODO confirm).
+RUN cp /usr/share/maven/ref/settings-docker.xml /root/.m2/settings.xml \
+    && mvn package site
+
+FROM hbpmip/java-mip:0.5.7
+# Runtime stage: ships the jars and site produced by the build stage together with the sources and docs.
+ENV DOCKER_IMAGE=java-jsi-clus-rm \
+    FUNCTION=java-jsi-clus-rm \
+    JAVA_CLASSPATH=${JAVA_CLASSPATH}:/opt/weka/props/:/usr/share/jars/jsi-clus-rm-deps.jar:/usr/share/jars/lib/*:/usr/share/jars/Redescription_mining_MW_ConstrainedGen1.jar:/usr/share/jars/CLUSNHMC.jar \
+    JAVA_MAINCLASS=eu.humanbrainproject.mip.algorithms.jsi.clus.rm.Entrypoint \
+    WEKA_HOME=/opt/weka
+
+COPY docker/databases-props/ /opt/weka/databases-props/
+COPY --from=build-java-env /project/deps/ /usr/share/jars/
+COPY --from=build-java-env /project/target/jsi-clus-rm-deps.jar /usr/share/jars/jsi-clus-rm-deps.jar
+COPY --from=build-java-env /project/target/site/ /var/www/html/
+COPY src/ /src/
+COPY doc/ /src/doc/
+
+RUN mkdir -p /opt/weka/props/weka/experiment \
+    && chown -R compute:compute /mip/ /opt/weka/ /usr/share/jars/ /src/ \
+    && chown -R root:www-data /var/www/html/
+WORKDIR /usr/share/jars
+
+# Build metadata consumed by the labels below; supply the values with --build-arg.
+ARG BUILD_DATE
+ARG VCS_REF
+ARG VERSION
+LABEL org.label-schema.build-date="$BUILD_DATE" \
+      maintainer="martin.breskvar@ijs.si" \
+      org.label-schema.name="hbpmip/java-jsi-clus-rm" \
+      org.label-schema.description="PCT-based algorithm for Redescription Mining" \
+      org.label-schema.url="https://github.com/LREN-CHUV/algorithm-repository" \
+      org.label-schema.vcs-type="git" \
+      org.label-schema.vcs-url="https://github.com/LREN-CHUV/algorithm-repository.git" \
+      org.label-schema.vcs-ref="$VCS_REF" \
+      org.label-schema.version="$VERSION" \
+      org.label-schema.vendor="JSI KT and IRB ZEL" \
+      org.label-schema.license="GPLv3" \
+      org.label-schema.docker.dockerfile="Dockerfile" \
+      org.label-schema.schema-version="1.0"
@@ -0,0 +1,42 @@
+[![JSI](https://img.shields.io/badge/JSI-KT-AF4C64.svg)](http://kt.ijs.si/)
+[![DockerHub](https://img.shields.io/badge/docker-hbpmip%2Fjava--jsi--clus--rm-008bb8.svg)](https://hub.docker.com/r/hbpmip/java-jsi-clus-rm/)
+[![ImageVersion](https://images.microbadger.com/badges/version/hbpmip/java-jsi-clus-rm.svg)](https://hub.docker.com/r/hbpmip/java-jsi-clus-rm/tags "hbpmip/java-jsi-clus-rm image tags")
+[![ImageLayers](https://images.microbadger.com/badges/image/hbpmip/java-jsi-clus-rm.svg)](https://microbadger.com/#/images/hbpmip/java-jsi-clus-rm "hbpmip/java-jsi-clus-rm on microbadger")
+
+# hbpmip/java-jsi-clus-rm: Redescription Mining using Predictive Clustering from JSI and IRB
+
+Implementation of the Redescription mining algorithm based on Predictive Clustering Trees. 
+For more details see https://github.com/matmih/CLUS-RM-library.
+
+## Usage
+
+```sh
+  docker run --rm --env [list of environment variables] hbpmip/java-jsi-clus-rm compute
+```
+
+where the environment variables are:
+
+* NODE: name of the node (machine) used for execution
+* JOB_ID: ID of the job.
+* IN_JDBC_DRIVER: org.postgresql.Driver
+* IN_JDBC_URL: URL to the input database, e.g. jdbc:postgresql://db:5432/features
+* IN_JDBC_USER: User for the input database
+* IN_JDBC_PASSWORD: Password for the input database
+* OUT_JDBC_DRIVER: org.postgresql.Driver
+* OUT_JDBC_URL: URL to the output database, e.g. jdbc:postgresql://db:5432/woken
+* OUT_JDBC_USER: User for the output database
+* OUT_JDBC_PASSWORD: Password for the output database
+* PARAM_covariables: Attributes contained in the first data view.
+* PARAM_variables: Attributes contained in the second data view.
+* PARAM_query: Query selecting the data to feed into the algorithm for training
+* MODEL_PARAM_minJS: Specify minimal redescription accuracy (measured with Jaccard index) required to return it to the user. Parameter values are contained in [0,1]. (default is MODEL_PARAM_minJS=0.5)
+* MODEL_PARAM_maxPval: Specify maximal redescription p-value required to return it to the user. Parameter values are contained in [0,1]. (default is MODEL_PARAM_maxPval=0.01)		
+* MODEL_PARAM_MinSupport: Specify minimal redescription support required to return it to the user. Parameter values are contained in [1,|E|], where |E| denotes number of entities in the dataset. (This parameter MUST be defined by the user and is domain and data dependent).
+* MODEL_PARAM_MaxSupport: Specify maximal redescription support allowed. Parameter values are contained in [1,|E|], where |E| denotes number of entities in the dataset. (default is MODEL_PARAM_MaxSupport = |E|).
+* MODEL_PARAM_numRandomRestarts: Specify the number of random initialization steps performed by the CLUS-RM (the default is MODEL_PARAM_numRandomRestarts = 1).
+* MODEL_PARAM_numIterations: Specify the number of iterations (also called alternations) performed by the CLUS-RM (the default is MODEL_PARAM_numIterations = 10).
+* MODEL_PARAM_numRetRed: Specify the number of redescriptions to be returned by the CLUS-RM (the default is MODEL_PARAM_numRetRed = 50).
+* MODEL_PARAM_attributeImportanceW1: Specify the attribute importance, for attributes contained in view 1, used in constraint-based redescription mining (the default is MODEL_PARAM_attributeImportanceW1 = "none"). Possible values are: "none" - allow redescriptions with any attributes from view1, "suggested" - allow defining combinations of attributes that increase redescription score (redescriptions containing specified attributes are preferred), "soft" - only return redescriptions satisfying at least part of specified constraints to the user (redescriptions satisfying larger portion of constraint set are preferred), "hard" - only return redescriptions satisfying all constraints defined in one constraint set. 
+* MODEL_PARAM_attributeImportanceW2: Specify the attribute importance, for attributes contained in view 2, used in constraint-based redescription mining (the default is MODEL_PARAM_attributeImportanceW2 = "none"). Possible values are: "none" - allow redescriptions with any attributes from view2, "suggested" - allow defining combinations of attributes that increase redescription score (redescriptions containing specified attributes are preferred), "soft" - only return redescriptions satisfying at least part of specified constraints to the user (redescriptions satisfying larger portion of constraint set are preferred), "hard" - only return redescriptions satisfying all constraints defined in one constraint set.
+* MODEL_PARAM_importantAttributesW1: defines constraint sets, for attributes contained in view 1, to be used in constraint-based redescription mining (default is MODEL_PARAM_importantAttributesW1=""). Constraints are specified in the format "{a;b;c},{a;d}", where a,b,c,d are some attributes contained in the first view (view1) of the data.
+* MODEL_PARAM_importantAttributesW2: defines constraint sets, for attributes contained in view 2, to be used in constraint-based redescription mining (default is MODEL_PARAM_importantAttributesW2=""). Constraints are specified in the format "{e;f;g},{h;i}", where e,f,g,h,i are some attributes contained in the second view (view2) of the data.
@@ -0,0 +1,32 @@
+#!/usr/bin/env bash
+
+set -o pipefail  # trace ERR through pipes
+set -o errtrace  # trace ERR through 'time command' and other functions
+set -o errexit   ## set -e : exit the script if any statement returns a non-true return value
+
+get_script_dir () {
+     SOURCE="${BASH_SOURCE[0]}"
+
+     while [ -h "$SOURCE" ]; do
+          DIR="$( cd -P "$( dirname "$SOURCE" )" && pwd )"
+          SOURCE="$( readlink "$SOURCE" )"
+          [[ $SOURCE != /* ]] && SOURCE="$DIR/$SOURCE"
+     done
+     cd -P "$( dirname "$SOURCE" )"
+     pwd
+}
+
+cd "$(get_script_dir)"
+
+if [[ $NO_SUDO || -n "$CIRCLECI" ]]; then
+  CAPTAIN="captain"
+elif groups $USER | grep &>/dev/null '\bdocker\b'; then
+  CAPTAIN="captain"
+else
+  CAPTAIN="sudo captain"
+fi
+
+BUILD_DATE=$(date -Iseconds) \
+  VCS_REF=$(git describe --tags --dirty) \
+  VERSION=$(git describe --tags --dirty) \
+  $CAPTAIN build
@@ -0,0 +1,7 @@
+target_image:
+  build: Dockerfile
+  image: hbpmip/java-jsi-clus-rm
+  pre:
+    - echo "Preparing java-jsi-clus-rm"
+  post:
+    - echo "Finished java-jsi-clus-rm"