Categories

Versions

You are viewing the RapidMiner Deployment documentation for version 9.6 - Check here for latest version

Deploy RapidMiner with easy Hadoop connectivity (single host)

The main purpose of the template defined below is to provide easy Hadoop connectivity.

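It deploys RapidMiner on a single host with the following components (one container per service in the docker-compose definition below):

  - Reverse proxy (rm-proxy-svc)
  - PostgreSQL database (rm-postgresql-svc)
  - RapidMiner Server (rm-server-svc)
  - RapidMiner Job Agent (rm-server-job-agent-svc)
  - Python Environment Manager, web UI and cron service (pem-webui-svc, pem-cron-svc)
  - Radoop Proxy (rm-radoop-proxy-svc)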

Alternative templates are available from the templates page.

Instructions

To deploy the template, take the following steps:

  1. If you have not yet done so, install Docker.

  2. From the sections below, copy the two files that define the docker-compose deployment, the environment file (.env) and the docker-compose definition (docker-compose.yml), to a folder on the server host.

  3. Connect to the server host (ssh), and change directory (cd) to the folder containing those two files.

  4. Deploy the template:

     docker-compose up -d
    

    Via this command, the Docker images will be automatically downloaded from Docker Hub (if they were not downloaded previously), and the services started.

Services

Once the deployment is running, the reverse proxy listens on the standard HTTP port (80) by default, as well as the HTTPS port (443), if an HTTPS certificate is configured. The deployment makes the following services / URLs available:

| URL | Description | Default login credentials |
| --- | --- | --- |
| http://<deployment-url> | Login screen for RapidMiner Server | Username: admin, Password: changeit |
| http://<deployment-url>/python-admin | Python Environment Manager | Username: admin, Password: changeit |

The environment file (.env)

#
# Global parameters
#
# Values shared by several services in docker-compose.yml. The secrets below
# are the sample values published with this template; replace them before
# using the deployment for anything beyond a trial.

# Prefix prepended to every RapidMiner image name in docker-compose.yml.
REGISTRY=rapidminer/
# Shared secret handed to the server (JOBSERVICE_AUTH_SECRET) and to the job
# agent (JOBAGENT_AUTH_SECRET). The sample value is the base64 encoding of the
# sample BROKER_ACTIVEMQ_PASSWORD below.
# NOTE(review): confirm whether the two must stay in sync when either changes.
AUTH_SECRET=TTY5MjUxbzRBN2ZIWThpNGVKNGo4V2xqOHk0dTNV
# Message broker credentials, handed to both the server and the job agent.
BROKER_ACTIVEMQ_USERNAME=amq-user
BROKER_ACTIVEMQ_PASSWORD=M69251o4A7fHY8i4eJ4j8Wlj8y4u3U
# Host, port and full URL of the RapidMiner Server container. The host is
# given to the job agent and the Radoop Proxy, the port to the Radoop Proxy,
# and the URL to the reverse proxy as RMSERVER_BACKEND.
RAPIDMINER_SERVER_HOST=rm-server-svc
RAPIDMINER_SERVER_PORT=8080
RAPIDMINER_SERVER_URL=http://rm-server-svc:8080
# Time zone passed to the server and job agent containers.
TZ=UTC

#
# RapidMiner Server
#

# Image tag used for both the server and the job agent images.
SERVER_VERSION=9.6.0
# Database connection settings. The host is the PostgreSQL service name; the
# schema, user and password are also passed to the PostgreSQL container as
# POSTGRES_DB / POSTGRES_USER / POSTGRES_PASSWORD, so both sides always agree.
SERVER_DBHOST=rm-postgresql-svc
SERVER_DBSCHEMA=rapidminer-server-db
SERVER_DBUSER=rmserver-db-user
SERVER_DBPASS=w61J784XSb24K4LRV97MbE16i8xa9O
# Passed to the server container unchanged.
# NOTE(review): presumably the server's maximum (JVM) memory — confirm.
SERVER_MAX_MEMORY=2048M

#
# Job Agent
#

# Broker URI the job agent connects to: the RapidMiner Server host, port 5672.
JOBAGENT_QUEUE_ACTIVEMQ_URI=failover:(tcp://rm-server-svc:5672)
# The next three values are passed to the job agent container unchanged.
# NOTE(review): the memory limit has no unit here; presumably MB — confirm.
JOBAGENT_CONTAINER_COUNT=2
JOB_QUEUE=DEFAULT
JOBAGENT_CONTAINER_MEMORYLIMIT=2048
# Points the job agent's Python registry base URL at the Python Environment
# Manager web UI service (port 82).
# NOTE(review): some docker-compose releases keep the surrounding double
# quotes as part of the value read from .env — confirm with the version in use.
RAPIDMINER_JOBAGENT_OPTS="-Djobagent.python.registryBaseUrl=http://pem-webui-svc:82/"

#
# Proxy
#

# Image tag of the reverse proxy image.
PROXY_VERSION=9.6.0
# Backend address of the Python Environment Manager web UI and the URL suffix
# under which the proxy is told to expose it (the /python-admin URL).
PEM_BACKEND=http://pem-webui-svc:82/
PEM_URL_SUFFIX=/python-admin
# Certificate, private key and DH parameter paths handed to the proxy
# container; these are paths inside that container.
HTTPS_CRT_PATH=/rapidminer/uploaded/certs/validated_cert.crt
HTTPS_KEY_PATH=/rapidminer/uploaded/certs/validated_cert.key
HTTPS_DH_PATH=/rapidminer/uploaded/certs/dhparam.pem

#
# Radoop Proxy
#

# Image tag of the Radoop Proxy image.
RADOOP_PROXY_VERSION=1.2.1
# Authentication: 'server|jwt|superuser'
RADOOP_PROXY_AUTHENTICATION=superuser
# Superuser credentials passed to the Radoop Proxy container. These are sample
# values; change them, because the proxy port is published on the host.
RADOOP_PROXY_SUPERUSERNAME=proxyadmin
RADOOP_PROXY_SUPERUSERPASSWORD=changeit
# Used both as the proxy's PORT setting and as the published host:container port.
RADOOP_PROXY_PORT=1081
# Passed to the container as WORKERSPOOLSIZE and SSL respectively.
RADOOP_PROXY_WORKERSPOOLSIZE=100
RADOOP_PROXY_SSL="off"

#
# Python environment manager
#
# Image tag shared by the web UI and cron images of the Python Environment Manager.
PEM_VERSION=9.6.0

The docker-compose definition (docker-compose.yml)

# Compose file format version 3. The ${...} placeholders used throughout are
# substituted from the .env file stored in the same folder as this file.
version: '3'
services:
  # Reverse proxy. It is the service that publishes the HTTP (80) and HTTPS
  # (443) ports on the host, and is configured with the RapidMiner Server
  # (RMSERVER_BACKEND) and the Python Environment Manager web UI (PEM_BACKEND,
  # under PEM_URL_SUFFIX) as its backends.
  rm-proxy-svc:
    image: ${REGISTRY}rapidminer-proxy:${PROXY_VERSION}
    hostname: rm-proxy-svc
    restart: always
    environment:
      - RMSERVER_BACKEND=${RAPIDMINER_SERVER_URL}
      - PEM_BACKEND=${PEM_BACKEND}
      - PEM_URL_SUFFIX=${PEM_URL_SUFFIX}
      - HTTPS_CRT_PATH=${HTTPS_CRT_PATH}
      - HTTPS_KEY_PATH=${HTTPS_KEY_PATH}
      - HTTPS_DH_PATH=${HTTPS_DH_PATH}
      - DEBUG_CONF_INIT=false
    ports:
      # HOST:CONTAINER mappings are quoted so that YAML always reads them as
      # strings rather than attempting numeric (base-60) interpretation.
      - '80:80'
      - '443:443'
    networks:
      rm-platform-int-net:
        aliases:
          - rm-proxy-svc
    volumes:
      # Read-only bind mount of the local ./ssl folder.
      - ./ssl:/etc/nginx/ssl:ro
      # NOTE(review): the HTTPS_*_PATH values in .env point below
      # /rapidminer/uploaded/, while this volume is mounted at
      # /rapidminer/pem/uploaded/ — confirm that the paths line up.
      - pem-uploaded-vol:/rapidminer/pem/uploaded/
  # PostgreSQL database. Its database name, user and password come from the
  # same SERVER_DB* variables that rm-server-svc receives for its connection.
  rm-postgresql-svc:
    image: 'postgres:9.6'
    restart: always
    hostname: rm-postgresql-svc
    networks:
      rm-platform-int-net:
        aliases:
          - rm-postgresql-svc
    volumes:
      # Named volume holding the database files.
      - 'rm-postgresql-vol:/var/lib/postgresql/data'
    environment:
      - 'POSTGRES_DB=${SERVER_DBSCHEMA}'
      - 'POSTGRES_USER=${SERVER_DBUSER}'
      - 'POSTGRES_PASSWORD=${SERVER_DBPASS}'
  # RapidMiner Server. Started after the database service; receives the
  # database connection settings, the broker credentials and the shared
  # authentication secret from the .env file.
  rm-server-svc:
    image: '${REGISTRY}rapidminer-server:${SERVER_VERSION}'
    restart: always
    hostname: rm-server-svc
    depends_on:
      - rm-postgresql-svc
    networks:
      rm-platform-int-net:
        aliases:
          - rm-server-svc
    volumes:
      - 'rm-server-bootstrap-vol:/bootstrap.d'
      - 'rm-server-home-vol:/persistent-rapidminer-home'
    environment:
      # Database connection
      - 'DBHOST=${SERVER_DBHOST}'
      - 'DBSCHEMA=${SERVER_DBSCHEMA}'
      - 'DBUSER=${SERVER_DBUSER}'
      - 'DBPASS=${SERVER_DBPASS}'
      - 'SERVER_MAX_MEMORY=${SERVER_MAX_MEMORY}'
      # Broker credentials and the secret shared with the job agent
      - 'BROKER_ACTIVEMQ_USERNAME=${BROKER_ACTIVEMQ_USERNAME}'
      - 'BROKER_ACTIVEMQ_PASSWORD=${BROKER_ACTIVEMQ_PASSWORD}'
      - 'JOBSERVICE_AUTH_SECRET=${AUTH_SECRET}'
      - 'TZ=${TZ}'
  # Job Agent. Started after the RapidMiner Server; it is given the server
  # host, the broker URI and credentials, and the same AUTH_SECRET value that
  # the server receives.
  rm-server-job-agent-svc:
    image: '${REGISTRY}rapidminer-execution-jobagent:${SERVER_VERSION}'
    restart: always
    hostname: rm-server-job-agent-svc
    depends_on:
      - rm-server-svc
    networks:
      rm-platform-int-net:
        aliases:
          - rm-server-job-agent-svc
    volumes:
      - 'rm-server-bootstrap-ja-vol:/bootstrap.d'
    environment:
      # Server and broker connection
      - 'RMSERVER_HOST=${RAPIDMINER_SERVER_HOST}'
      - 'JOBAGENT_QUEUE_ACTIVEMQ_URI=${JOBAGENT_QUEUE_ACTIVEMQ_URI}'
      - 'JOBAGENT_QUEUE_ACTIVEMQ_USERNAME=${BROKER_ACTIVEMQ_USERNAME}'
      - 'JOBAGENT_QUEUE_ACTIVEMQ_PASSWORD=${BROKER_ACTIVEMQ_PASSWORD}'
      - 'JOBAGENT_AUTH_SECRET=${AUTH_SECRET}'
      # Job execution settings
      - 'JOBAGENT_CONTAINER_COUNT=${JOBAGENT_CONTAINER_COUNT}'
      - 'JOB_QUEUE=${JOB_QUEUE}'
      - 'JOBAGENT_CONTAINER_MEMORYLIMIT=${JOBAGENT_CONTAINER_MEMORYLIMIT}'
      - 'RAPIDMINER_JOBAGENT_OPTS=${RAPIDMINER_JOBAGENT_OPTS}'
      - 'TZ=${TZ}'
  # Python Environment Manager web UI. Shares the pem-uploaded-vol volume with
  # the proxy and the PEM cron service.
  pem-webui-svc:
    image: '${REGISTRY}python-environment-manager-webui:${PEM_VERSION}'
    restart: always
    hostname: pem-webui-svc
    networks:
      rm-platform-int-net:
        aliases:
          - pem-webui-svc
    volumes:
      - 'pem-uploaded-vol:/var/www/html/uploaded/'
  # Python Environment Manager cron service. Mounts the shared upload volume
  # and a separate volume for /var/log/.
  pem-cron-svc:
    image: '${REGISTRY}python-environment-manager-cron:${PEM_VERSION}'
    restart: always
    hostname: pem-cron-svc
    networks:
      rm-platform-int-net:
        aliases:
          - pem-cron-svc
    volumes:
      - 'pem-cron-log-vol:/var/log/'
      - 'pem-uploaded-vol:/rapidminer/uploaded/'
      # The host's Docker socket is bind-mounted into this container, which
      # lets the container talk to the host's Docker daemon.
      - '/var/run/docker.sock:/var/run/docker.sock'
  # Radoop Proxy. Publishes RADOOP_PROXY_PORT on the host and is given the
  # RapidMiner Server host and port as SERVERHOST / SERVERPORT.
  rm-radoop-proxy-svc:
    image: ${REGISTRY}radoop-proxy:${RADOOP_PROXY_VERSION}
    hostname: rm-radoop-proxy-svc
    restart: always
    environment:
      - AUTHENTICATION=${RADOOP_PROXY_AUTHENTICATION}
      - SUPERUSERNAME=${RADOOP_PROXY_SUPERUSERNAME}
      - SUPERUSERPASSWORD=${RADOOP_PROXY_SUPERUSERPASSWORD}
      - PORT=${RADOOP_PROXY_PORT}
      - WORKERSPOOLSIZE=${RADOOP_PROXY_WORKERSPOOLSIZE}
      - SSL=${RADOOP_PROXY_SSL}
      - SERVERHOST=${RAPIDMINER_SERVER_HOST}
      - SERVERPORT=${RAPIDMINER_SERVER_PORT}
    ports:
      # Quoted so the HOST:CONTAINER mapping is always read as a string.
      - '${RADOOP_PROXY_PORT}:${RADOOP_PROXY_PORT}'
    # Attach to the same network as every other service. Without this entry
    # the container joins only the implicit default network, where the
    # SERVERHOST name (rm-server-svc) cannot be resolved.
    networks:
      rm-platform-int-net:
        aliases:
          - rm-radoop-proxy-svc

# Named volumes mounted by the services above. Each one is declared with an
# explicit empty mapping, i.e. no options beyond the defaults.
volumes:
  rm-postgresql-vol: {}
  rm-server-bootstrap-vol: {}
  rm-server-home-vol: {}
  rm-server-bootstrap-ja-vol: {}
  pem-uploaded-vol: {}
  pem-cron-log-vol: {}

# Network that the services above attach to; each service that lists it
# registers its own service name as an alias on it.
networks:
  rm-platform-int-net: