From e0ee4081491317ad19c9ce222753c889f28c176f Mon Sep 17 00:00:00 2001 From: Joseph D Natoli Date: Thu, 19 Dec 2013 16:42:09 -0800 Subject: [PATCH] Adding IDH plugin basic implementation Functionality: * install and provision Intel Hadoop Manager and Intel Hadoop * configure Intel Hadoop to use Cinder volumes as HDFS backend * manual cluster scaling support * Swift integration * cluster configs - the same configs as in Vanilla Hadoop * configs validation - the same as in Vanilla plugin This is initial version. It doesn't cover bugs filed here: https://bugs.launchpad.net/savanna/+bugs?field.searchtext=%7BIDH%5D Co-Authored-By: Andrew Lazarev Implements blueprint idh-savanna-plugin Change-Id: I70363869b61d73222d247b566d499c2fd6fb9201 --- MANIFEST.in | 1 + savanna/exceptions.py | 7 + savanna/plugins/intel/__init__.py | 0 savanna/plugins/intel/client/__init__.py | 0 savanna/plugins/intel/client/client.py | 33 + savanna/plugins/intel/client/cluster.py | 44 + savanna/plugins/intel/client/context.py | 21 + savanna/plugins/intel/client/nodes.py | 65 + savanna/plugins/intel/client/params.py | 76 + savanna/plugins/intel/client/rest.py | 78 + savanna/plugins/intel/client/services.py | 137 + savanna/plugins/intel/client/session.py | 49 + savanna/plugins/intel/config_helper.py | 128 + savanna/plugins/intel/exceptions.py | 31 + savanna/plugins/intel/installer.py | 411 +++ savanna/plugins/intel/plugin.py | 173 ++ .../plugins/intel/resources/configuration.xsd | 103 + .../intel/resources/hadoop-default.xml | 1371 +++++++++ .../plugins/intel/resources/hdfs-default.xml | 1193 ++++++++ .../intel/resources/mapred-default.xml | 2678 +++++++++++++++++ savanna/tests/unit/plugins/intel/__init__.py | 0 .../unit/plugins/intel/client/__init__.py | 0 .../unit/plugins/intel/client/response.py | 28 + .../unit/plugins/intel/client/test_client.py | 310 ++ .../tests/unit/plugins/intel/test_plugin.py | 61 + .../tests/unit/plugins/intel/test_utils.py | 32 + .../test-default-with-type-and-locale.xml | 43 + savanna/tests/unit/utils/test_xml_utils.py | 18 + savanna/utils/xmlutils.py | 23 +- setup.cfg | 1 + 30 files changed, 7114 insertions(+), 1 deletion(-) create mode 100644 savanna/plugins/intel/__init__.py create mode 100644 savanna/plugins/intel/client/__init__.py create mode 100644 savanna/plugins/intel/client/client.py create mode 100644 savanna/plugins/intel/client/cluster.py create mode 100644 savanna/plugins/intel/client/context.py create mode 100644 savanna/plugins/intel/client/nodes.py create mode 100644 savanna/plugins/intel/client/params.py create mode 100644 savanna/plugins/intel/client/rest.py create mode 100644 savanna/plugins/intel/client/services.py create mode 100644 savanna/plugins/intel/client/session.py create mode 100644 savanna/plugins/intel/config_helper.py create mode 100644 savanna/plugins/intel/exceptions.py create mode 100644 savanna/plugins/intel/installer.py create mode 100644 savanna/plugins/intel/plugin.py create mode 100644 savanna/plugins/intel/resources/configuration.xsd create mode 100644 savanna/plugins/intel/resources/hadoop-default.xml create mode 100644 savanna/plugins/intel/resources/hdfs-default.xml create mode 100644 savanna/plugins/intel/resources/mapred-default.xml create mode 100644 savanna/tests/unit/plugins/intel/__init__.py create mode 100644 savanna/tests/unit/plugins/intel/client/__init__.py create mode 100644 savanna/tests/unit/plugins/intel/client/response.py create mode 100644 savanna/tests/unit/plugins/intel/client/test_client.py create mode 100644 
savanna/tests/unit/plugins/intel/test_plugin.py create mode 100644 savanna/tests/unit/plugins/intel/test_utils.py create mode 100644 savanna/tests/unit/resources/test-default-with-type-and-locale.xml diff --git a/MANIFEST.in b/MANIFEST.in index 88d11b96..3c90fee1 100644 --- a/MANIFEST.in +++ b/MANIFEST.in @@ -9,6 +9,7 @@ include savanna/db/migration/alembic_migrations/versions/README recursive-include savanna/locale * +include savanna/plugins/intel/resources/*.xml include savanna/plugins/vanilla/resources/*.xml include savanna/plugins/vanilla/resources/*.sh include savanna/plugins/vanilla/resources/*.sql diff --git a/savanna/exceptions.py b/savanna/exceptions.py index 40cbba35..ea142876 100644 --- a/savanna/exceptions.py +++ b/savanna/exceptions.py @@ -182,3 +182,10 @@ class ThreadException(SavannaException): self.message = "An error occurred in thread '%s': %s" % ( thread_description, str(e)) self.code = "THREAD_EXCEPTION" + + +class NotImplementedException(SavannaException): + code = "NOT_IMPLEMENTED" + + def __init__(self, feature): + self.message = "Feature '%s' is not implemented" % feature diff --git a/savanna/plugins/intel/__init__.py b/savanna/plugins/intel/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/savanna/plugins/intel/client/__init__.py b/savanna/plugins/intel/client/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/savanna/plugins/intel/client/client.py b/savanna/plugins/intel/client/client.py new file mode 100644 index 00000000..0617094b --- /dev/null +++ b/savanna/plugins/intel/client/client.py @@ -0,0 +1,33 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from savanna.plugins.intel.client import cluster +from savanna.plugins.intel.client import nodes +from savanna.plugins.intel.client import params +from savanna.plugins.intel.client import rest as r +from savanna.plugins.intel.client import services + + +class IntelClient(): + def __init__(self, manager_ip, cluster_name): + #TODO(alazarev) make credentials configurable (bug #1262881) + self.rest = r.RESTClient(manager_ip, 'admin', 'admin') + self.cluster_name = cluster_name + self._ctx = self + + self.cluster = cluster.Cluster(self) + self.nodes = nodes.Nodes(self) + self.params = params.Params(self) + self.services = services.Services(self) diff --git a/savanna/plugins/intel/client/cluster.py b/savanna/plugins/intel/client/cluster.py new file mode 100644 index 00000000..2cc62dac --- /dev/null +++ b/savanna/plugins/intel/client/cluster.py @@ -0,0 +1,44 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from savanna.plugins.intel.client import context as c +from savanna.plugins.intel.client import session + + +class Cluster(c.IntelContext): + def create(self): + url = '/cluster' + data = { + 'name': self.cluster_name, + 'dnsresolution': True, + 'acceptlicense': True + } + + return self.rest.post(url, data) + + def get(self): + url = '/cluster/%s' % self.cluster_name + return self.rest.get(url) + + def install_software(self, nodes): + _nodes = [{'hostname': host} for host in nodes] + url = '/cluster/%s/nodes/commands/installsoftware' % self.cluster_name + session_id = self.rest.post(url, _nodes)['sessionID'] + return session.wait(self, session_id) + + def upload_authzkeyfile(self, authzkeyfile): + url = '/cluster/%s/upload/authzkey' % self.cluster_name + return self.rest.post(url, + files={'file': authzkeyfile})['upload result'] diff --git a/savanna/plugins/intel/client/context.py b/savanna/plugins/intel/client/context.py new file mode 100644 index 00000000..13897e8b --- /dev/null +++ b/savanna/plugins/intel/client/context.py @@ -0,0 +1,21 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + + +class IntelContext(object): + def __init__(self, ctx): + self._ctx = ctx._ctx + self.cluster_name = ctx.cluster_name + self.rest = ctx.rest diff --git a/savanna/plugins/intel/client/nodes.py b/savanna/plugins/intel/client/nodes.py new file mode 100644 index 00000000..45cefcda --- /dev/null +++ b/savanna/plugins/intel/client/nodes.py @@ -0,0 +1,65 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
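For orientation, here is a minimal usage sketch (not part of the patch) of the client pieces above: IntelClient wires a single RESTClient into the Cluster helper through IntelContext. The manager address and cluster name are placeholders, and the snippet assumes the savanna tree is importable and an IDH manager is actually listening.

from savanna.plugins.intel.client import client as c


def create_demo_cluster(manager_ip='192.0.2.10', name='demo-cluster'):
    # IntelClient uses the hard-coded admin/admin account shown above
    client = c.IntelClient(manager_ip, name)
    # POST /cluster with the name, DNS resolution and license-acceptance flags
    client.cluster.create()
    # GET /cluster/<name> returns the manager's JSON view of the new cluster
    return client.cluster.get()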
+ +from savanna.plugins.intel.client import context as c +from savanna.plugins.intel.client import session +from savanna.plugins.intel import exceptions as iex + + +class Nodes(c.IntelContext): + def add(self, nodes, rack, username, path_to_key, keypass=''): + hosts = { + 'method': 'useauthzkeyfile', + 'nodeinfo': map(lambda host: { + 'hostname': host, + 'username': username, + 'passphrase': keypass, + 'authzkeyfile': path_to_key, + 'rackName': rack + }, nodes) + } + + url = '/cluster/%s/nodes' % self.cluster_name + resp = self.rest.post(url, hosts)['items'] + + for node_info in resp: + if node_info['info'] != 'Connected': + raise iex.IntelPluginException( + 'Error adding nodes: %s' % node_info['iporhostname']) + + def get(self): + url = '/cluster/%s/nodes' % self.cluster_name + return self.rest.get(url) + + def get_status(self, node): + url = '/cluster/%s/nodes/%s' % (self.cluster_name, node) + return self.rest.get(url)['status'] + + def delete(self, node): + url = '/cluster/%s/nodes/%s' % (self.cluster_name, node) + return self.rest.delete(url) + + def config(self, force=False): + url = ('/cluster/%s/nodes/commands/confignodes/%s' + % (self.cluster_name, 'force' if force else 'noforce')) + + session_id = self.rest.post(url)['sessionID'] + return session.wait(self, session_id) + + def stop(self, nodes): + url = '/cluster/%s/nodes/commands/stopnodes' % self.cluster_name + data = [{'hostname': host} for host in nodes] + + return self.rest.post(url, data) diff --git a/savanna/plugins/intel/client/params.py b/savanna/plugins/intel/client/params.py new file mode 100644 index 00000000..239bb70f --- /dev/null +++ b/savanna/plugins/intel/client/params.py @@ -0,0 +1,76 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
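Nodes.add() above wraps the manager's 'useauthzkeyfile' registration call and fails if any host does not report 'Connected'. A hedged sketch of how it is typically driven follows; the host names and manager address are placeholders, while the 'hadoop' user, '/Default' rack and key path match what installer.py later in this patch uses.

from savanna.plugins.intel.client import client as c

client = c.IntelClient('192.0.2.10', 'demo-cluster')  # placeholder address/name
hosts = ['master-001.example.org', 'worker-001.example.org']

# Register the hosts with the manager using the uploaded authorized key.
client.nodes.add(hosts, '/Default', 'hadoop', '/home/hadoop/.ssh/id_rsa')

# Push the node configuration and block on the returned session
# until the manager reports completion.
client.nodes.config(force=True)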
+ +from savanna import exceptions +from savanna.plugins.intel.client import context as c + + +class BaseParams(c.IntelContext): + def __init__(self, ctx, service): + super(BaseParams, self).__init__(ctx) + self.service = service + + def add(self, item, value, desc=''): + data = { + 'editdesc': desc, + 'items': [ + { + 'type': self.service, + 'item': item, + 'value': value, + 'desc': desc + } + ] + } + url = ('/cluster/%s/configuration/%s' + % (self.cluster_name, self.service)) + return self.rest.post(url, data) + + def update(self, item, value, desc='', nodes=None): + data = { + 'editdesc': desc, + 'items': [ + { + 'type': self.service, + 'item': item, + 'value': value + } + ] + } + if nodes: + data = { + 'editdesc': desc, + 'items': map(lambda node: { + 'type': self.service, + 'item': item, + 'value': value, + 'hostname': node + }, nodes) + } + + url = ('/cluster/%s/configuration/%s' + % (self.cluster_name, self.service)) + return self.rest.put(url, data) + + def get(self, hosts, item): + raise exceptions.NotImplementedException("BaseParams.get") + + +class Params(c.IntelContext): + def __init__(self, ctx): + super(Params, self).__init__(ctx) + self.hadoop = BaseParams(self, 'hadoop') + self.hdfs = BaseParams(self, 'hdfs') + self.mapred = BaseParams(self, 'mapred') diff --git a/savanna/plugins/intel/client/rest.py b/savanna/plugins/intel/client/rest.py new file mode 100644 index 00000000..19ebc1fa --- /dev/null +++ b/savanna/plugins/intel/client/rest.py @@ -0,0 +1,78 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
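The Params helpers above map directly onto the manager's configuration endpoint. The sketch below contrasts a cluster-wide update with a per-node one, mirroring how _configure_storage() later in this patch sets the dfs.* directories; the address, cluster name, paths and host names are placeholders.

from savanna.plugins.intel.client import client as c

client = c.IntelClient('192.0.2.10', 'demo-cluster')  # placeholders

# Cluster-wide value: a single item with no 'hostname' field in the payload.
client.params.hdfs.update('dfs.name.dir', '/volumes/disk1/dfs/name')

# Per-node values: update() emits one item per host when nodes= is given.
client.params.hdfs.update('dfs.data.dir', '/volumes/disk1/dfs/data',
                          nodes=['worker-001.example.org',
                                 'worker-002.example.org'])

# add() creates a parameter that is not defined yet (see _configure_swift()).
client.params.hadoop.add('hadoop.tmp.dir', '/volumes/disk1/tmp')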
+ +import json +import requests +from requests import auth + +from savanna.openstack.common import log as logging +from savanna.plugins.intel import exceptions as iex + + +LOG = logging.getLogger(__name__) + + +class RESTClient(): + def __init__(self, manager_ip, auth_username, auth_password): + #TODO(alazarev) make port configurable (bug #1262895) + self.base_url = ('https://%s:9443/restapi/intelcloud/api/v1' + % manager_ip) + LOG.debug("Connecting to manager with URL of %s", self.base_url) + + self.auth = auth.HTTPBasicAuth(auth_username, auth_password) + + def get(self, url): + url = self.base_url + url + LOG.debug("Sending GET to URL of %s", url) + r = requests.get(url, verify=False, auth=self.auth) + return self._check_response(r) + + def post(self, url, data=None, files=None): + url = self.base_url + url + LOG.debug("Sending POST to URL '%s' (%s files): %s", url, + len(files) if files else 0, + data if data else 'no data') + r = requests.post(url, data=json.dumps(data) if data else None, + verify=False, auth=self.auth, files=files) + return self._check_response(r) + + def delete(self, url): + url = self.base_url + url + LOG.debug("Sending DELETE to URL of %s", url) + r = requests.delete(url, verify=False, auth=self.auth) + return self._check_response(r) + + def put(self, url, data=None): + url = self.base_url + url + if data: + LOG.debug("Sending PUT to URL of %s: %s", url, data) + r = requests.put(url, data=json.dumps(data), verify=False, + auth=self.auth) + else: + LOG.debug("Sending PUT to URL of %s with no data", url) + r = requests.put(url, verify=False, auth=self.auth) + + return self._check_response(r) + + def _check_response(self, resp): + LOG.debug("Response with HTTP code %s, and content of %s", + resp.status_code, resp.text) + if not resp.ok: + raise iex.IntelPluginException( + "Request to manager returned with code '%s', reason '%s' " + "and message '%s'" % (resp.status_code, resp.reason, + json.loads(resp.text)['message'])) + else: + return json.loads(resp.text) diff --git a/savanna/plugins/intel/client/services.py b/savanna/plugins/intel/client/services.py new file mode 100644 index 00000000..bc8d1e74 --- /dev/null +++ b/savanna/plugins/intel/client/services.py @@ -0,0 +1,137 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
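For reference, the HTTP exchange behind RESTClient.get() can be reproduced with requests directly. The host, port and admin/admin credentials below are the defaults hard-coded above; the cluster name is a placeholder.

import json

import requests
from requests import auth

base_url = 'https://192.0.2.10:9443/restapi/intelcloud/api/v1'
resp = requests.get(base_url + '/cluster/demo-cluster',
                    verify=False,  # matches RESTClient: no certificate check
                    auth=auth.HTTPBasicAuth('admin', 'admin'))
if not resp.ok:
    # _check_response() above raises IntelPluginException in this case
    raise RuntimeError('manager returned %s (%s)'
                       % (resp.status_code, resp.reason))
print(json.loads(resp.text))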
+ +from savanna import context +from savanna.openstack.common import log as logging +from savanna.plugins.intel.client import context as c +from savanna.plugins.intel.client import session +from savanna.plugins.intel import exceptions as iex + +LOG = logging.getLogger(__name__) + + +class BaseService(c.IntelContext): + def __init__(self, ctx, service_name): + super(BaseService, self).__init__(ctx) + self.service = service_name + + def start(self): + url = ('/cluster/%s/services/%s/commands/start' + % (self.cluster_name, self.service)) + + self.rest.post(url) + + timeout = 120 + cur_time = 0 + while cur_time < timeout: + context.sleep(2) + if self.status() == 'running': + break + else: + cur_time += 2 + else: + raise iex.IntelPluginException( + "Service '%s' has failed to start in %s seconds" + % (self.service, timeout)) + + def stop(self): + url = ('/cluster/%s/services/%s/commands/stop' + % (self.cluster_name, self.service)) + + return self.rest.post(url) + + def status(self): + url = '/cluster/%s/services' % self.cluster_name + statuses = self.rest.get(url)['items'] + for st in statuses: + if st['serviceName'] == self.service: + return st['status'] + + raise iex.IntelPluginException( + "Service '%s' is not installed on cluster '%s'" + % (self.service, self.cluster_name)) + + def get_nodes(self): + url = '/cluster/%s/services/%s' % (self.cluster_name, self.service) + return self.rest.get(url) + + def add_nodes(self, role, nodes): + url = ('/cluster/%s/services/%s/roles' + % (self.cluster_name, self.service)) + + data = map(lambda host: { + 'rolename': role, + 'hostname': host + }, nodes) + + return self.rest.post(url, data) + + +class HDFSService(BaseService): + def format(self, force=False): + url = ('/cluster/%s/services/hdfs/commands/hdfsformat/%s' + % (self.cluster_name, 'force' if force else 'noforce')) + + session_id = self.rest.post(url)['sessionID'] + return session.wait(self, session_id) + + def decommission_nodes(self, nodes, force=False): + url = ('/cluster/%s/nodes/commands/decommissionnodes/%s' + % (self.cluster_name, 'force' if force else 'noforce')) + data = map(lambda host: { + 'hostname': host + }, nodes) + + return self.rest.post(url, data) + + def get_datanodes_status(self): + url = '/cluster/%s/nodes/commands/datanodes/status' % self.cluster_name + return self.rest.get(url)['items'] + + def get_datanode_status(self, datanode): + stats = self.get_datanodes_status() + for stat in stats: + if stat['hostname'] == datanode: + return stat['status'].strip() + + raise iex.IntelPluginException( + "Datanode service is is not installed on node '%s'" % datanode) + + +class Services(c.IntelContext): + def __init__(self, ctx): + super(Services, self).__init__(ctx) + self.hdfs = HDFSService(self, 'hdfs') + self.mapred = BaseService(self, 'mapred') + self.hive = BaseService(self, 'hive') + self.oozie = BaseService(self, 'oozie') + + def add(self, services): + _services = map(lambda service: { + 'serviceName': service, + 'type': service + }, services) + url = '/cluster/%s/services' % self.cluster_name + + return self.rest.post(url, _services) + + def get_services(self): + url = '/cluster/%s/services' % self.cluster_name + + return self.rest.get(url) + + def delete_service(self, service): + url = '/cluster/%s/services/%s' % (self.cluster_name, service) + return self.rest.delete(url) diff --git a/savanna/plugins/intel/client/session.py b/savanna/plugins/intel/client/session.py new file mode 100644 index 00000000..d4b02342 --- /dev/null +++ b/savanna/plugins/intel/client/session.py @@ 
-0,0 +1,49 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from savanna import context +from savanna.openstack.common import log as logging +from savanna.plugins.intel import exceptions as iex + +LOG = logging.getLogger(__name__) + + +def get(ctx, session_id): + url = '/cluster/%s/session/%s' % (ctx.cluster_name, session_id) + return ctx.rest.get(url) + + +def wait(ctx, session_id): + #TODO(lazarev) add check on savanna cluster state (exit on delete) + #TODO(alazarev) make configurable (bug #1262897) + timeout = 4*60*60 # 4 hours + cur_time = 0 + while cur_time < timeout: + info_items = get(ctx, session_id)['items'] + for item in info_items: + progress = item['nodeprogress'] + if progress['info'].strip() == '_ALLFINISH': + return + else: + context.sleep(10) + cur_time += 10 + + debug_msg = 'Hostname: %s\nInfo: %s' + debug_msg = debug_msg % (progress['hostname'], progress['info']) + LOG.debug(debug_msg) + else: + raise iex.IntelPluginException( + "Cluster '%s' has failed to start in %s minutes" + % (ctx.cluster_name, timeout / 60)) diff --git a/savanna/plugins/intel/config_helper.py b/savanna/plugins/intel/config_helper.py new file mode 100644 index 00000000..9b4cefee --- /dev/null +++ b/savanna/plugins/intel/config_helper.py @@ -0,0 +1,128 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
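session.wait() above is the blocking half of every long-running manager command. The sketch below mirrors Cluster.install_software() earlier in this patch; the host names are placeholders, and ctx can be any IntelContext-style object (the IntelClient itself works, since it exposes cluster_name and rest).

from savanna.plugins.intel.client import session


def install_software_and_wait(ctx, hosts):
    # Start the asynchronous command; the manager answers with a session id.
    url = '/cluster/%s/nodes/commands/installsoftware' % ctx.cluster_name
    data = [{'hostname': host} for host in hosts]
    session_id = ctx.rest.post(url, data)['sessionID']

    # Poll every 10 seconds until '_ALLFINISH' or the 4-hour timeout above.
    return session.wait(ctx, session_id)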
+ +from savanna.plugins import provisioning as p +from savanna.utils import xmlutils as x + + +CORE_DEFAULT = x.load_hadoop_xml_defaults_with_type_and_locale( + 'plugins/intel/resources/hadoop-default.xml') + +HDFS_DEFAULT = x.load_hadoop_xml_defaults_with_type_and_locale( + 'plugins/intel/resources/hdfs-default.xml') + +MAPRED_DEFAULT = x.load_hadoop_xml_defaults_with_type_and_locale( + 'plugins/intel/resources/mapred-default.xml') + +XML_CONFS = { + "Hadoop": [CORE_DEFAULT], + "HDFS": [HDFS_DEFAULT], + "MapReduce": [MAPRED_DEFAULT] +} + +IDH_TARBALL_URL = p.Config('IDH tarball URL', 'general', 'cluster', priority=1, + default_value='http://repo1.intelhadoop.com:3424/' + 'setup/setup-intelhadoop-' + '2.5.1-en-evaluation.RHEL.tar.gz') + +OS_REPO_URL = p.Config('OS repository URL', 'general', 'cluster', priority=1, + is_optional=True, + default_value='http://mirror.centos.org/' + 'centos-6/6/os/x86_64') + +IDH_REPO_URL = p.Config('IDH repository URL', 'general', 'cluster', + priority=1, is_optional=True, + default_value='http://repo1.intelhadoop.com:3424' + '/evaluation/en/RHEL/2.5.1/rpm') + +ENABLE_SWIFT = p.Config('Enable Swift', 'general', 'cluster', + config_type="bool", priority=1, + default_value=True, is_optional=True) + +HIDDEN_CONFS = ['fs.default.name', 'dfs.name.dir', 'dfs.data.dir', + 'mapred.job.tracker', 'mapred.system.dir', 'mapred.local.dir'] + +CLUSTER_WIDE_CONFS = ['dfs.block.size', 'dfs.permissions', 'dfs.replication', + 'dfs.replication.min', 'dfs.replication.max', + 'io.file.buffer.size', 'mapreduce.job.counters.max', + 'mapred.output.compress', 'io.compression.codecs', + 'mapred.output.compression.codec', + 'mapred.output.compression.type', + 'mapred.compress.map.output', + 'mapred.map.output.compression.codec'] + +PRIORITY_1_CONFS = ['dfs.datanode.du.reserved', + 'dfs.datanode.failed.volumes.tolerated', + 'dfs.datanode.max.xcievers', 'dfs.datanode.handler.count', + 'dfs.namenode.handler.count', 'mapred.child.java.opts', + 'mapred.jobtracker.maxtasks.per.job', + 'mapred.job.tracker.handler.count', + 'mapred.map.child.java.opts', + 'mapred.reduce.child.java.opts', + 'io.sort.mb', 'mapred.tasktracker.map.tasks.maximum', + 'mapred.tasktracker.reduce.tasks.maximum'] + +PRIORITY_1_CONFS += CLUSTER_WIDE_CONFS + +CFG_TYPE = { + "Boolean": "bool", + "String": "string", + "Integer": "int", + "Choose": "string", + "Class": "string", + "Directory": "string", + "Float": "string", + "Int_range": "string", +} + + +def _initialise_configs(): + configs = [] + + for service, config_lists in XML_CONFS.iteritems(): + for config_list in config_lists: + for config in config_list: + if config['name'] not in HIDDEN_CONFS: + cfg = p.Config( + config['name'], service, "cluster", is_optional=True, + config_type="string", + default_value=str(config['value']), + description=config['description']) + + if config.get('type'): + cfg.config_type = CFG_TYPE[config['type']] + if cfg.config_type == 'bool': + cfg.default_value = cfg.default_value == 'true' + if cfg.config_type == 'int': + if cfg.default_value: + cfg.default_value = int(cfg.default_value) + else: + cfg.config_type = 'string' + if config['name'] in PRIORITY_1_CONFS: + cfg.priority = 1 + configs.append(cfg) + + configs.append(IDH_TARBALL_URL) + configs.append(IDH_REPO_URL) + configs.append(OS_REPO_URL) + configs.append(ENABLE_SWIFT) + return configs + + +PLUGIN_CONFIGS = _initialise_configs() + + +def get_plugin_configs(): + return PLUGIN_CONFIGS diff --git a/savanna/plugins/intel/exceptions.py b/savanna/plugins/intel/exceptions.py new file 
mode 100644 index 00000000..fccb5500 --- /dev/null +++ b/savanna/plugins/intel/exceptions.py @@ -0,0 +1,31 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import savanna.exceptions as e + + +class NotSingleManagerException(e.SavannaException): + message = "Intel hadoop cluster should contain only 1 Intel " \ + "Manager instance. Actual manager count is %s" + + def __init__(self, mng_count): + self.message = self.message % mng_count + self.code = "NOT_SINGLE_MANAGER" + + +class IntelPluginException(e.SavannaException): + def __init__(self, message): + self.message = message + self.code = "INTEL_PLUGIN_EXCEPTION" diff --git a/savanna/plugins/intel/installer.py b/savanna/plugins/intel/installer.py new file mode 100644 index 00000000..3d1eca90 --- /dev/null +++ b/savanna/plugins/intel/installer.py @@ -0,0 +1,411 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
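Both exception classes above carry a message and a code that the API layer reports back to the user. Below is a small, hypothetical sketch of surfacing IntelPluginException, which RESTClient raises for every non-2xx manager response; the client construction is the same placeholder as in the earlier sketches.

from savanna.plugins.intel.client import client as c
from savanna.plugins.intel import exceptions as iex

client = c.IntelClient('192.0.2.10', 'demo-cluster')  # placeholders
try:
    client.cluster.get()
except iex.IntelPluginException as e:
    # e.message carries the manager-supplied error text
    print('IDH manager call failed: %s' % e.message)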
+ +import six +import telnetlib + +from savanna import conductor +from savanna import context +from savanna.openstack.common import log as logging +from savanna.plugins.general import utils as u +from savanna.plugins.intel.client import client as c +from savanna.plugins.intel import config_helper as c_helper +from savanna.plugins.intel import exceptions as iex +from savanna.swift import swift_helper as swift +from savanna.utils import crypto + + +conductor = conductor.API +LOG = logging.getLogger(__name__) + +_INST_CONF_TEMPLATE = """ +network_interface=eth0 +mode=silent +accept_jdk_license=accept +how_to_setup_os_repo=2 +os_repo=%s +os_repo_username= +os_repo_password= +os_repo_proxy= +how_to_setup_idh_repo=1 +idh_repo=%s +idh_repo_username= +idh_repo_password= +idh_repo_proxy= +firewall_selinux_setting=1""" + +SWIFT_LIB_URL = \ + 'http://savanna-files.mirantis.com/hadoop-swift/hadoop-swift-latest.jar' + + +def install_manager(cluster): + LOG.info("Starting Install Manager Process") + mng_instance = u.get_instance(cluster, 'manager') + + idh_tarball_path = \ + cluster.cluster_configs['general'].get('IDH tarball URL') + if not idh_tarball_path: + idh_tarball_path = c_helper.IDH_TARBALL_URL.default_value + + idh_tarball_filename = idh_tarball_path.rsplit('/', 1)[-1] + idh_dir = idh_tarball_filename[:idh_tarball_filename.find('.tar.gz')] + LOG.info("IDH tgz will be retrieved from: \'%s\'", idh_tarball_path) + + idh_repo = cluster.cluster_configs['general'].get('IDH repository URL') + if not idh_repo: + idh_repo = c_helper.IDH_REPO_URL.default_value + + os_repo = cluster.cluster_configs['general'].get('OS repository URL') + if not os_repo: + os_repo = c_helper.OS_REPO_URL.default_value + + idh_install_cmd = 'sudo ./%s/install.sh --mode=silent 2>&1' % idh_dir + + with mng_instance.remote() as r: + LOG.info("Download IDH manager ") + try: + r.execute_command('curl -O %s 2>&1' % idh_tarball_path) + except Exception as e: + raise RuntimeError("Unable to download IDH manager from %s", + idh_tarball_path, e) + + # unpack archive + LOG.info("Unpack manager %s ", idh_tarball_filename) + try: + r.execute_command('tar xzf %s 2>&1' % idh_tarball_filename) + except Exception as e: + raise RuntimeError("Unable to unpack tgz %s", + idh_tarball_filename, e) + + # install idh + LOG.debug("Install manager with %s : ", idh_install_cmd) + inst_conf = _INST_CONF_TEMPLATE % (os_repo, idh_repo) + r.write_file_to('%s/ui-installer/conf' % idh_dir, inst_conf) + #TODO(alazarev) make timeout configurable (bug #1262897) + r.execute_command(idh_install_cmd, timeout=3600) + + # fix nginx persimmions bug + r.execute_command('sudo chmod o+x /var/lib/nginx/ /var/lib/nginx/tmp ' + '/var/lib/nginx/tmp/client_body') + + # waiting start idh manager + #TODO(alazarev) make timeout configurable (bug #1262897) + timeout = 600 + LOG.debug("Waiting %s seconds for Manager to start : ", timeout) + while timeout: + try: + telnetlib.Telnet(mng_instance.management_ip, 9443) + break + except IOError: + timeout -= 2 + context.sleep(2) + else: + message = ("IDH Manager failed to start in %s minutes on node '%s' " + "of cluster '%s'" + % (timeout / 60, mng_instance.management_ip, cluster.name)) + LOG.error(message) + raise iex.IntelPluginException(message) + + +def configure_os(cluster): + instances = u.get_instances(cluster) + configure_os_from_instances(cluster, instances) + + +def create_hadoop_ssh_keys(cluster): + private_key, public_key = crypto.generate_key_pair() + extra = { + 'hadoop_private_ssh_key': private_key, + 
'hadoop_public_ssh_key': public_key + } + return conductor.cluster_update(context.ctx(), cluster, {'extra': extra}) + + +def configure_os_from_instances(cluster, instances): + for instance in instances: + with instance.remote() as remote: + LOG.debug("Configuring OS settings on %s : ", instance.hostname()) + + # configure hostname, RedHat/Centos specific + remote.replace_remote_string('/etc/sysconfig/network', + 'HOSTNAME=.*', + 'HOSTNAME=%s' % instance.hostname()) + # disable selinux and iptables, because Intel distribution requires + # this to be off + remote.execute_command('sudo /usr/sbin/setenforce 0') + remote.replace_remote_string('/etc/selinux/config', + 'SELINUX=.*', 'SELINUX=disabled') + # disable iptables + remote.execute_command('sudo /sbin/service iptables stop') + remote.execute_command('sudo /sbin/chkconfig iptables off') + + # create 'hadoop' user + remote.write_files_to({ + 'id_rsa': cluster.extra.get('hadoop_private_ssh_key'), + 'authorized_keys': cluster.extra.get('hadoop_public_ssh_key') + }) + remote.execute_command( + 'sudo useradd hadoop && ' + 'sudo sh -c \'echo "hadoop ALL=(ALL) NOPASSWD:ALL" ' + '>> /etc/sudoers\' && ' + 'sudo mkdir -p /home/hadoop/.ssh/ && ' + 'sudo mv id_rsa authorized_keys /home/hadoop/.ssh && ' + 'sudo chown -R hadoop:hadoop /home/hadoop/.ssh && ' + 'sudo chmod 600 /home/hadoop/.ssh/{id_rsa,authorized_keys}') + + swift_enable = \ + cluster.cluster_configs['general'].get('Enable Swift') + if not swift_enable: + swift_enable = c_helper.ENABLE_SWIFT.default_value + + if swift_enable: + swift_lib_path = '/usr/lib/hadoop/lib/hadoop-swift-latest.jar' + cmd = ('sudo curl \'%s\' -o %s --create-dirs' + % (SWIFT_LIB_URL, swift_lib_path)) + remote.execute_command(cmd) + + +def _configure_services(client, cluster): + nn_host = u.get_namenode(cluster).hostname() + snn = u.get_secondarynamenodes(cluster) + snn_host = snn[0].hostname() if snn else None + jt_host = u.get_jobtracker(cluster).hostname() + dn_hosts = [dn.hostname() for dn in u.get_datanodes(cluster)] + tt_hosts = [tt.hostname() for tt in u.get_tasktrackers(cluster)] + + oozie_host = u.get_oozie(cluster).hostname() if u.get_oozie( + cluster) else None + hive_host = u.get_hiveserver(cluster).hostname() if u.get_hiveserver( + cluster) else None + + services = [] + if u.get_namenode(cluster): + services += ['hdfs'] + + if u.get_jobtracker(cluster): + services += ['mapred'] + + if oozie_host: + services += ['oozie'] + + if hive_host: + services += ['hive'] + + LOG.debug("Add services: %s" % ', '.join(services)) + client.services.add(services) + + LOG.debug("Assign roles to hosts") + client.services.hdfs.add_nodes('PrimaryNameNode', [nn_host]) + + client.services.hdfs.add_nodes('DataNode', dn_hosts) + if snn: + client.services.hdfs.add_nodes('SecondaryNameNode', [snn_host]) + + if oozie_host: + client.services.oozie.add_nodes('Oozie', [oozie_host]) + + if hive_host: + client.services.hive.add_nodes('HiveServer', [hive_host]) + + client.services.mapred.add_nodes('JobTracker', [jt_host]) + client.services.mapred.add_nodes('TaskTracker', tt_hosts) + + +def _configure_storage(client, cluster): + datanode_ng = u.get_node_groups(cluster, 'datanode')[0] + storage_paths = datanode_ng.storage_paths() + dn_hosts = [i.hostname() for i in u.get_datanodes(cluster)] + + name_dir_param = ",".join( + [st_path + '/dfs/name' for st_path in storage_paths]) + data_dir_param = ",".join( + [st_path + '/dfs/data' for st_path in storage_paths]) + client.params.hdfs.update('dfs.name.dir', name_dir_param) + 
client.params.hdfs.update('dfs.data.dir', data_dir_param, nodes=dn_hosts) + + +def _configure_swift(client, cluster): + swift_enable = cluster.cluster_configs['general'].get('Enable Swift') + if swift_enable is None or swift_enable: + swift_configs = swift.get_swift_configs() + for conf in swift_configs: + client.params.hadoop.add(conf['name'], conf['value']) + + +def _add_user_params(client, cluster): + for p in six.iteritems(cluster.cluster_configs["Hadoop"]): + client.params.hadoop.update(p[0], p[1]) + + for p in six.iteritems(cluster.cluster_configs["HDFS"]): + client.params.hdfs.update(p[0], p[1]) + + for p in six.iteritems(cluster.cluster_configs["MapReduce"]): + client.params.mapred.update(p[0], p[1]) + + +def install_cluster(cluster): + mng_instance = u.get_instance(cluster, 'manager') + mng_ip = mng_instance.management_ip + + all_hosts = list(set([i.hostname() for i in u.get_instances(cluster)])) + + client = c.IntelClient(mng_ip, cluster.name) + + LOG.info("Create cluster") + client.cluster.create() + + LOG.info("Add nodes to cluster") + rack = '/Default' + client.nodes.add(all_hosts, rack, 'hadoop', + '/home/hadoop/.ssh/id_rsa') + + LOG.info("Install software") + client.cluster.install_software(all_hosts) + + LOG.info("Configure services") + _configure_services(client, cluster) + + LOG.info("Deploy cluster") + client.nodes.config(force=True) + + LOG.info("Provisioning configs") + # cinder and ephemeral drive support + _configure_storage(client, cluster) + # swift support + _configure_swift(client, cluster) + # user configs + _add_user_params(client, cluster) + + LOG.info("Format HDFS") + client.services.hdfs.format() + + +def start_cluster(cluster): + client = c.IntelClient( + u.get_instance(cluster, 'manager').management_ip, cluster.name) + + LOG.debug("Starting hadoop services") + client.services.hdfs.start() + + client.services.mapred.start() + if u.get_hiveserver(cluster): + client.services.hive.start() + + if u.get_oozie(cluster): + client.services.oozie.start() + + +def scale_cluster(cluster, instances): + scale_ins_hosts = [i.hostname() for i in instances] + dn_hosts = [dn.hostname() for dn in u.get_datanodes(cluster)] + tt_hosts = [tt.hostname() for tt in u.get_tasktrackers(cluster)] + to_scale_dn = [] + to_scale_tt = [] + for i in scale_ins_hosts: + if i in dn_hosts: + to_scale_dn.append(i) + + if i in tt_hosts: + to_scale_tt.append(i) + + mng_ip = u.get_instance(cluster, 'manager').management_ip + client = c.IntelClient(mng_ip, cluster.name) + rack = '/Default' + client.nodes.add(scale_ins_hosts, rack, 'hadoop', + cluster.extra['manager_authzkeyfile_path']) + client.cluster.install_software(scale_ins_hosts) + + if to_scale_tt: + client.services.mapred.add_nodes('TaskTracker', to_scale_tt) + + if to_scale_dn: + client.services.hdfs.add_nodes('DataNode', to_scale_dn) + + client.nodes.config() + + if to_scale_dn: + client.services.hdfs.start() + + if to_scale_tt: + client.services.mapred.start() + + +def decommission_nodes(cluster, instances): + dec_hosts = [i.hostname() for i in instances] + dn_hosts = [dn.hostname() for dn in u.get_datanodes(cluster)] + tt_hosts = [dn.hostname() for dn in u.get_tasktrackers(cluster)] + + mng_ip = u.get_instances(cluster, 'manager')[0].management_ip + client = c.IntelClient(mng_ip, cluster.name) + + dec_dn_hosts = [] + for dec_host in dec_hosts: + if dec_host in dn_hosts: + dec_dn_hosts.append(dec_host) + + if dec_dn_hosts: + client.services.hdfs.decommission_nodes(dec_dn_hosts) + + #TODO(alazarev) make timeout configurable (bug 
#1262897)
+    timeout = 14400  # 4 hours
+    cur_time = 0
+    for host in dec_dn_hosts:
+        while cur_time < timeout:
+            if client.services.hdfs.get_datanode_status(
+                    host) == 'Decomissioned':
+                break
+            context.sleep(5)
+            cur_time += 5
+        else:
+            LOG.warn("Failed to decommission node '%s' of cluster '%s' "
+                     "in %s minutes" % (host, cluster.name, timeout/60))
+
+    client.nodes.stop(dec_hosts)
+
+    # wait for the services to stop
+    #TODO(alazarev) make timeout configurable (bug #1262897)
+    timeout = 600  # 10 minutes
+    cur_time = 0
+    for instance in instances:
+        while cur_time < timeout:
+            stopped = True
+            if instance.hostname() in dn_hosts:
+                code, out = instance.remote().execute_command(
+                    'sudo /sbin/service hadoop-datanode status',
+                    raise_when_error=False)
+                if out.strip() != 'datanode is stopped':
+                    stopped = False
+                if out.strip() == 'datanode dead but pid file exists':
+                    instance.remote().execute_command(
+                        'sudo rm -f '
+                        '/var/run/hadoop/hadoop-hadoop-datanode.pid')
+            if instance.hostname() in tt_hosts:
+                code, out = instance.remote().execute_command(
+                    'sudo /sbin/service hadoop-tasktracker status',
+                    raise_when_error=False)
+                if out.strip() != 'tasktracker is stopped':
+                    stopped = False
+            if stopped:
+                break
+            else:
+                context.sleep(5)
+                cur_time += 5
+        else:
+            LOG.warn("Failed to stop services on node '%s' of cluster '%s' "
+                     "in %s minutes" % (instance, cluster.name, timeout/60))
+
+    for node in dec_hosts:
+        LOG.info("Deleting node '%s' on cluster '%s'" % (node, cluster.name))
+        client.nodes.delete(node)
diff --git a/savanna/plugins/intel/plugin.py b/savanna/plugins/intel/plugin.py
new file mode 100644
index 00000000..3a2fcde9
--- /dev/null
+++ b/savanna/plugins/intel/plugin.py
@@ -0,0 +1,173 @@
+# Copyright (c) 2013 Intel Corporation
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+# implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
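decommission_nodes() above relies on a poll-until-status loop in two places; the condensed sketch below isolates the first of those loops, assuming a client built as in the earlier sketches. The timeout is the same 4-hour default, the host name is a placeholder, and 'Decomissioned' is kept verbatim because it is the literal status string the manager returns.

from savanna import context


def wait_for_decommission(client, host, timeout=14400):
    # Returns True once the datanode reports 'Decomissioned', False on timeout.
    cur_time = 0
    while cur_time < timeout:
        if client.services.hdfs.get_datanode_status(host) == 'Decomissioned':
            return True
        context.sleep(5)
        cur_time += 5
    return False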
+ +from savanna import conductor +from savanna import context +from savanna.openstack.common import log as logging +from savanna.plugins.general import exceptions as ex +from savanna.plugins.general import utils as u +from savanna.plugins.intel import config_helper as c_helper +from savanna.plugins.intel import exceptions as i_ex +from savanna.plugins.intel import installer as ins +from savanna.plugins import provisioning as p + +conductor = conductor.API +LOG = logging.getLogger(__name__) + + +class IDHProvider(p.ProvisioningPluginBase): + def __init__(self): + self.processes = { + "Manager": ["manager"], + "HDFS": ["namenode", "datanode", "secondarynamenode"], + "MapReduce": ["jobtracker", "tasktracker"], + "Hadoop": [] # for hadoop parameters in UI + } + + def get_description(self): + return \ + 'The IDH OpenStack plugin works with project ' \ + 'Savanna to automate the deployment of the Intel Distribution ' \ + 'of Apache Hadoop on OpenStack based ' \ + 'public & private clouds' + + def get_node_processes(self, hadoop_version): + return self.processes + + def get_versions(self): + return ['2.5.1'] + + def get_title(self): + return "Intel(R) Distribution for Apache Hadoop* Software" + + def get_configs(self, hadoop_version): + return c_helper.get_plugin_configs() + + def get_hive_config_path(self): + return '/etc/hive/conf/hive-site.xml' + + def configure_cluster(self, cluster): + LOG.info("Configure IDH cluster") + cluster = ins.create_hadoop_ssh_keys(cluster) + ins.configure_os(cluster) + ins.install_manager(cluster) + ins.install_cluster(cluster) + + def start_cluster(self, cluster): + LOG.info("Start IDH cluster") + ins.start_cluster(cluster) + self._set_cluster_info(cluster) + + def validate(self, cluster): + nn_count = sum([ng.count for ng + in u.get_node_groups(cluster, 'namenode')]) + if nn_count != 1: + raise ex.NotSingleNameNodeException(nn_count) + + jt_count = sum([ng.count for ng + in u.get_node_groups(cluster, 'jobtracker')]) + if jt_count > 1: + raise ex.NotSingleJobTrackerException(jt_count) + + tt_count = sum([ng.count for ng + in u.get_node_groups(cluster, 'tasktracker')]) + if jt_count == 0 and tt_count > 0: + raise ex.TaskTrackersWithoutJobTracker() + + mng_count = sum([ng.count for ng + in u.get_node_groups(cluster, 'manager')]) + if mng_count != 1: + raise i_ex.NotSingleManagerException(mng_count) + + def scale_cluster(self, cluster, instances): + ins.configure_os_from_instances(cluster, instances) + ins.scale_cluster(cluster, instances) + + def decommission_nodes(self, cluster, instances): + ins.decommission_nodes(cluster, instances) + + def validate_scaling(self, cluster, existing, additional): + self._validate_additional_ng_scaling(cluster, additional) + self._validate_existing_ng_scaling(cluster, existing) + + def _get_scalable_processes(self): + return ["datanode", "tasktracker"] + + def _get_by_id(self, lst, id): + for obj in lst: + if obj.id == id: + return obj + + def _validate_additional_ng_scaling(self, cluster, additional): + jt = u.get_jobtracker(cluster) + scalable_processes = self._get_scalable_processes() + + for ng_id in additional: + ng = self._get_by_id(cluster.node_groups, ng_id) + if not set(ng.node_processes).issubset(scalable_processes): + raise ex.NodeGroupCannotBeScaled( + ng.name, "Intel plugin cannot scale nodegroup" + " with processes: " + + ' '.join(ng.node_processes)) + if not jt and 'tasktracker' in ng.node_processes: + raise ex.NodeGroupCannotBeScaled( + ng.name, "Intel plugin cannot scale node group with " + "processes which have no 
master-processes run " + "in cluster") + + def _validate_existing_ng_scaling(self, cluster, existing): + scalable_processes = self._get_scalable_processes() + dn_to_delete = 0 + for ng in cluster.node_groups: + if ng.id in existing: + if ng.count > existing[ng.id] and "datanode" in \ + ng.node_processes: + dn_to_delete += ng.count - existing[ng.id] + if not set(ng.node_processes).issubset(scalable_processes): + raise ex.NodeGroupCannotBeScaled( + ng.name, "Intel plugin cannot scale nodegroup" + " with processes: " + + ' '.join(ng.node_processes)) + + def _set_cluster_info(self, cluster): + mng = u.get_instances(cluster, 'manager')[0] + nn = u.get_namenode(cluster) + jt = u.get_jobtracker(cluster) + oozie = u.get_oozie(cluster) + + #TODO(alazarev) make port configurable (bug #1262895) + info = {'IDH Manager': { + 'Web UI': 'https://%s:9443' % mng.management_ip + }} + + if jt: + #TODO(alazarev) make port configurable (bug #1262895) + info['MapReduce'] = { + 'Web UI': 'http://%s:50030' % jt.management_ip + } + if nn: + #TODO(alazarev) make port configurable (bug #1262895) + info['HDFS'] = { + 'Web UI': 'http://%s:50070' % nn.management_ip + } + + if oozie: + #TODO(alazarev) make port configurable (bug #1262895) + info['JobFlow'] = { + 'Oozie': 'http://%s:11000' % oozie.management_ip + } + + ctx = context.ctx() + conductor.cluster_update(ctx, cluster, {'info': info}) diff --git a/savanna/plugins/intel/resources/configuration.xsd b/savanna/plugins/intel/resources/configuration.xsd new file mode 100644 index 00000000..b5573d09 --- /dev/null +++ b/savanna/plugins/intel/resources/configuration.xsd @@ -0,0 +1,103 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/savanna/plugins/intel/resources/hadoop-default.xml b/savanna/plugins/intel/resources/hadoop-default.xml new file mode 100644 index 00000000..6c85ee58 --- /dev/null +++ b/savanna/plugins/intel/resources/hadoop-default.xml @@ -0,0 +1,1371 @@ + + + + + + + default.heap.size + 4096 + Integer + perf + + The default heap size of cluster + + true + + Default memory size for datanode, jobtracker and hbase master. + + + + hadoop.extra.classpath + + true + String + basic + + Extra Java CLASSPATH element + + true + + Extra Java CLASSPATH elements. Will be appended to the value of HADOOP_CLASSPATH in hadoop-env.sh. + + + + hadoop.tmp.dir + true + /tmp/hadoop-${user.name} + String + filesystem + + The temp directory for hadoop + + + A base for other temporary directories. + + + + hadoop.native.lib + true + true + Boolean + basic + + use the native hadoop libraries + + + Should native hadoop libraries, if present, be used. + + + + hadoop.http.filter.initializers + + true + String + network + + hadoop web filter + + + A comma separated list of class names. Each class in the list + must extend org.apache.hadoop.http.FilterInitializer. The + corresponding Filter will be initialized. Then, the Filter will be + applied to all user viewing jsp and servlet web pages. The ordering + of the list defines the ordering of the filters. 
+ + + + hadoop.security.group.mapping + org.apache.hadoop.security.ShellBasedUnixGroupsMapping + Class + security + + hadoop user mapping + + + Class for user to group mapping (get groups for a given user) + + + + hadoop.security.authorization + false + Boolean + security + + hadoop security authorization + + + Is service-level authorization enabled? + + + + hadoop.security.authentication + simple + Choose + simple,kerberos + security + + hadoop security authorization level + + + possible values are simple (no authentication), and kerberos + + + + hadoop.security.token.service.use_ip + true + Boolean + security + + Controls whether tokens always use IP addresses + + + + Controls whether tokens always use IP addresses. DNS changes will not + be detected if this option is enabled. Existing client connections + that break will always reconnect to the IP of the original host. New + clients will connect to the host's new IP but fail to locate a token. + Disabling this option will allow existing and new clients to detect + an IP change and continue to locate the new host's token. + + + + + + hadoop.workaround.non.threadsafe.getpwuid + false + Boolean + security + + hadoop thread safe + + + Some operating systems or authentication modules are known to + have broken implementations of getpwuid_r and getpwgid_r, such that these + calls are not thread-safe. Symptoms of this problem include JVM crashes + with a stack trace inside these functions. If your system exhibits this + issue, enable this configuration parameter to include a lock around the + calls as a workaround. + An incomplete list of some systems known to have this issue is available + at http://wiki.apache.org/hadoop/KnownBrokenPwuidImplementations + + + + hadoop.kerberos.kinit.command + true + kinit + String + security + + Kerberos credentials + + + Used to periodically renew Kerberos credentials when provided + to Hadoop. The default setting assumes that kinit is in the PATH of users + running the Hadoop client. Change this to the absolute path to kinit if this + is not the case. + + + + + hadoop.logfile.size + false + 10000000 + Integer + perf + + log file size + + + The max size of each log file + + + + hadoop.logfile.count + false + 10 + Integer + perf + + log file number + + + The max number of log files + + + + + io.file.buffer.size + 4096 + Integer + perf + + File buffer size + + + The size of buffer for use in sequence files. + The size of this buffer should probably be a multiple of hardware + page size (4096 on Intel x86), and it determines how much data is + buffered during read and write operations. + + basic +
TextItem
+ true +
+ + io.bytes.per.checksum + 512 + 512 + 4096 + Integer + perf + + Checksum size + + + The number of bytes per checksum. Must not be larger than + io.file.buffer.size. + + ioconf +
TextItem
+ false +
+ + dfs.datanode.protocol.client-request.client-verification-field.exists + false + true + Boolean + io + + checksum.client-verification-field + + + Allow DataNode to skip loading Checksum files. + + true + + + io.skip.checksum.errors + false + Boolean + io + + Skip checksum errors + + + If true, when a checksum error is encountered while + reading a sequence file, entries are skipped, instead of throwing an + exception. + + ioconf +
RadioGroupItem
+ true,false + false +
+ + io.compression.codecs + org.apache.hadoop.io.compress.DefaultCodec,org.apache.hadoop.io.compress.GzipCodec,org.apache.hadoop.io.compress.BZip2Codec,org.apache.hadoop.io.compress.DeflateCodec,org.apache.hadoop.io.compress.SnappyCodec + Class + perf + + Compression codecs + + + A list of the compression codec classes that can be used + for compression/decompression. + + + + io.serializations + org.apache.hadoop.io.serializer.WritableSerialization + Class + perf + + Io serializaions + + + A list of serialization classes that can be used for + obtaining serializers and deserializers. + + + + + + fs.default.name + false + file:/// + String + filesystem + + File System name + + true + + The name of the default file system. A URI whose + scheme and authority determine the FileSystem implementation. The + uri's scheme determines the config property (fs.SCHEME.impl) naming + the FileSystem implementation class. The uri's authority is used to + determine the host, port, etc. for a filesystem. + + + + + hadoop.namenode + + true + true + String + namenode + + NameNode name + + + Server name for namenode. + + + + hadoop.namenode.port + 8020 + String + namenode + + NameNode port + + true + + Server port for namenode. + + + + fs.trash.interval + 0 + Integer + filesystem + + Interval to delete checkpoints + + + Number of minutes after which the checkpoints + get deleted. If zero, the trash feature is disabled. + + + + fs.file.impl + org.apache.hadoop.fs.LocalFileSystem + Class + filesystem + + File system for file implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for file: uris. + + + + fs.hdfs.impl + org.apache.hadoop.hdfs.DistributedFileSystem + Class + filesystem + + File system for hdfs implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for hdfs: uris. + + + + fs.webhdfs.impl + org.apache.hadoop.hdfs.web.WebHdfsFileSystem + Class + filesystem + + File system for webhdfs implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for webhdfs: uris. + + + + fs.s3.impl + org.apache.hadoop.fs.s3.S3FileSystem + Class + filesystem + + File system for s3 implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for s3: uris. + + + + + fs.s3n.impl + org.apache.hadoop.fs.s3native.NativeS3FileSystem + Class + filesystem + + File system for s3n implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for s3n: (Native S3) uris. + + + + fs.kfs.impl + org.apache.hadoop.fs.kfs.KosmosFileSystem + Class + filesystem + + File system for kfs implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for kfs: uris. + + + + fs.hftp.impl + org.apache.hadoop.hdfs.HftpFileSystem + Class + filesystem + + File system for hftp implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for hftp: uris. + + + + fs.hsftp.impl + org.apache.hadoop.hdfs.HsftpFileSystem + Class + filesystem + + The FileSystem for hsftp + + org.apache.hadoop.fs.FileSystem + + The FileSystem for hsftp: uris + + + + fs.ftp.impl + org.apache.hadoop.fs.ftp.FTPFileSystem + Class + filesystem + + File system for ftp implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for ftp: uris. + + + + fs.ramfs.impl + org.apache.hadoop.fs.InMemoryFileSystem + Class + filesystem + + File system for ramfs implementation + + org.apache.hadoop.fs.FileSystem + + The FileSystem for ramfs: uris. 
+ + + + fs.har.impl + org.apache.hadoop.fs.HarFileSystem + Class + filesystem + + File system for hadoop archives implementation + + org.apache.hadoop.fs.FileSystem + + The filesystem for Hadoop archives. + + + + fs.har.impl.disable.cache + true + Boolean + filesystem + + Cache hadoop archive instance + + + Don't cache 'har' filesystem instances. + + + + fs.checkpoint.dir + ${hadoop.tmp.dir}/dfs/namesecondary + ${hadoop.tmp.dir}/dfs/namesecondary + /hadoop/namesecondary + Directory + filesystem + + Checkpoint directory + + + Determines where on the local filesystem the DFS secondary + name node should store the temporary images to merge. + If this is a comma-delimited list of directories then the image is + replicated in all of the directories for redundancy. + + + + fs.checkpoint.edits.dir + ${fs.checkpoint.dir} + Directory + filesystem + + Checkpoint edit directory + + + Determines where on the local filesystem the DFS secondary + name node should store the temporary edits to merge. + If this is a comma-delimited list of directoires then the edits is + replicated in all of the directoires for redundancy. + Default value is same as fs.checkpoint.dir + + + + fs.checkpoint.period + 3600 + Integer + filesystem + + Checkpoint period + + + The number of seconds between two periodic checkpoints. + + + + fs.checkpoint.size + 67108864 + Integer + filesystem + + Edit log size to checkpoint + + + The size of the current edit log (in bytes) that triggers + a periodic checkpoint even if the fs.checkpoint.period hasn't expired. + + + + fs.s3.block.size + 67108864 + Integer + filesystem + + Block size to write to S3 + + + Block size to use when writing files to S3. + + + + fs.s3.buffer.dir + ${hadoop.tmp.dir}/s3 + Directory + filesystem + + Buffer file directory + + + Determines where on the local filesystem the S3 filesystem + should store files before sending them to S3 + (or after retrieving them from S3). + + + + + fs.s3.maxRetries + 4 + Integer + filesystem + + Maximum retries number to reading or writing file to S3 + + + The maximum number of retries for reading or writing files to S3, + before we signal failure to the application. + + + + + fs.s3.sleepTimeSeconds + 10 + Integer + filesystem + + Seconds to sleep between every retries to reading or writing file to S3 + + + The number of seconds to sleep between each S3 retry. + + + + + fs.automatic.close + true + Boolean + filesystem + + FileSystem auto close + + + By default, FileSystem instances are automatically closed at program + exit using a JVM shutdown hook. Setting this property to false disables this + behavior. This is an advanced option that should only be used by server applications + requiring a more carefully orchestrated shutdown sequence. + + + + + fs.s3n.block.size + 67108864 + Integer + filesystem + + Block size + + + Block size to use when reading files using the Native S3 + filesystem (s3n: URIs). + + + + local.cache.size + 10737418240 + Integer + perf + + cache size + + + + The limit on the size of cache you want to keep, set by default to + 10GB. This will act as a soft limit on the cache directory for out of + band data. + + + + + io.seqfile.compress.blocksize + 1000000 + Integer + io + + Minum block size for compression + + + The minimum block size for compression in block compressed + SequenceFiles. + + + + + io.seqfile.lazydecompress + true + Boolean + io + + Lazy decompress + + + Should values of block-compressed SequenceFiles be decompressed + only when necessary. 
+ + + + + io.seqfile.sorter.recordlimit + 1000000 + Integer + io + + Limit number of records + + + The limit on number of records to be kept in memory in a spill + in SequenceFiles.Sorter + + + + + io.mapfile.bloom.size + 1048576 + Integer + io + + The size of BloomFilters + + + The size of BloomFilter-s used in BloomMapFile. Each time this many + keys is appended the next BloomFilter will be created (inside a DynamicBloomFilter). + Larger values minimize the number of filters, which slightly increases the performance, + but may waste too much space if the total number of keys is usually much smaller + than this number. + + + + + io.mapfile.bloom.error.rate + 0.005 + Float + io + + Rate of false positives in BloomFilter + + + The rate of false positives in BloomFilter-s used in BloomMapFile. + As this value decreases, the size of BloomFilter-s increases exponentially. This + value is the probability of encountering false positives (default is 0.5%). + + + + + hadoop.util.hash.type + murmur + Choose + murmur,jenkins + basic + + Hash type + + + The default implementation of Hash. Currently this can take one of the + two values: 'murmur' to select MurmurHash and 'jenkins' to select JenkinsHash. + + + + + + ipc.client.idlethreshold + 4000 + Integer + ipc + + Connection threshold + + + Defines the threshold number of connections after which + connections will be inspected for idleness. + + + + + ipc.client.kill.max + 10 + Integer + ipc + + Maximum clients number + + + Defines the maximum number of clients to disconnect in one go. + + + + + ipc.client.connection.maxidletime + 10000 + Integer + ipc + + Maximum time for connection + + + The maximum time in msec after which a client will bring down the + connection to the server. + + + + + ipc.client.connect.max.retries + 10 + Integer + ipc + + Maximum number retries + + + Indicates the number of retries a client will make to establish + a server connection. + + + + + ipc.server.listen.queue.size + 128 + Integer + ipc + + Length of the server listen queue + + + Indicates the length of the listen queue for servers accepting + client connections. + + + + + ipc.server.tcpnodelay + false + Boolean + ipc + + Turn on Nagle's algorithem + + + Turn on/off Nagle's algorithm for the TCP socket connection on + the server. Setting to true disables the algorithm and may decrease latency + with a cost of more/smaller packets. + + + + + ipc.client.tcpnodelay + false + Boolean + ipc + + Whether to Turn on Nagle's algorithem on the client + + + Turn on/off Nagle's algorithm for the TCP socket connection on + the client. Setting to true disables the algorithm and may decrease latency + with a cost of more/smaller packets. + + + + + webinterface.private.actions + false + Boolean + network + + Web interfaces + + + If set to true, the web interfaces of JT and NN may contain + actions, such as kill job, delete file, etc., that should + not be exposed to public. Enable this option if the interfaces + are only reachable by those who have the right authorization. + + + + + + hadoop.rpc.socket.factory.class.default + org.apache.hadoop.net.StandardSocketFactory + Class + proxy + + Socketfactory Class + + + Default SocketFactory to use. This parameter is expected to be + formatted as "package.FactoryClassName". + + + + + hadoop.rpc.socket.factory.class.ClientProtocol + + Class + proxy + + Socketfactory Class to use to Connect to DFS + + + SocketFactory to use to connect to a DFS. If null or empty, use + hadoop.rpc.socket.class.default. 
This socket factory is also used by + DFSClient to create sockets to DataNodes. + + + + + hadoop.socks.server + + true + String + proxy + + Address used by SocksSocketfactory + + + Address (host:port) of the SOCKS server to be used by the + SocksSocketFactory. + + + + + + topology.node.switch.mapping.impl + org.apache.hadoop.net.ScriptBasedMapping + Class + org.apache.hadoop.net.DNSToSwitchMapping + rack + + Topology node switch mapping implemention + + + The default implementation of the DNSToSwitchMapping. It + invokes a script specified in topology.script.file.name to resolve + node names. If the value for topology.script.file.name is not set, the + default value of DEFAULT_RACK is returned for all node names. + + + + + topology.script.file.name + false + + + /usr/lib/intelcloud/rackmap.sh + String + rack + + The script name to get NetworkTopology name + + true + + The script name that should be invoked to resolve DNS names to + NetworkTopology names. Example: the script would take host.foo.bar as an + argument, and return /rack1 as the output. + + + + + topology.script.number.args + false + 100 + 100 + 1 + Integer + rack + + The number of topology script args + + true + + The max number of args that the script configured with + topology.script.file.name should be run with. Each arg is an + IP address. + + + + + hadoop.security.uid.cache.secs + 14400 + Integer + security + + The timeout for cache from UID to UserName + + + NativeIO maintains a cache from UID to UserName. This is + the timeout for an entry in that cache. + + + + + hadoop.http.authentication.type + simple + + Choose + simple,kerberos,${hadoop.security.authentication} + security + + Authentication type for HTTP endpoint + + + + Defines authentication used for Oozie HTTP endpoint. + Supported values are: simple | kerberos | #AUTHENTICATION_HANDLER_CLASSNAME# + + + + + hadoop.http.authentication.token.validity + 36000 + Integer + security + + Authentication token validity + + + + Indicates how long (in seconds) an authentication token is valid before it has + to be renewed. + + + + + hadoop.http.authentication.signature.secret + hadoop + String + security + + The signature secret for signing the Authentication token + + + + The signature secret for signing the authentication tokens. + If not set a random secret is generated at startup time. + The same secret should be used for JT/NN/DN/TT configurations. + + + + + hadoop.http.authentication.cookie.domain + + true + String + security + + The domain to store authentication token + + + + The domain to use for the HTTP cookie that stores the authentication token. + In order to authentiation to work correctly across all Hadoop nodes web-consoles + the domain must be correctly set. + IMPORTANT: when using IP addresses, browsers ignore cookies with domain settings. + For this setting to work properly all nodes, the cluster must be configured + to generate URLs with hostname.domain names on it. + + + + + hadoop.http.authentication.simple.anonymous.allowed + true + Boolean + security + + Simple authentication anonymous allowance + + + + Indicates if anonymous requests are allowed when using 'simple' authentication. + + + + + hadoop.http.authentication.kerberos.principal + true + 1 + HTTP/localhost@LOCALHOST + String + security + + Authentication principal + + + Indicates the Kerberos principal to be used for HTTP endpoint. + The principal MUST start with 'HTTP/' as per Kerberos HTTP SPNEGO + specification. 
+ + + + + hadoop.http.authentication.kerberos.keytab + true + ${user.home}/hadoop.keytab + String + security + + Location of keytab file + + + + Location of the keytab file with the credentials for the principal. + Referring to the same keytab file Oozie uses for its Kerberos credentials for Hadoop. + + + + + + hadoop.security.group.mapping.ldap.url + true + + true + String + security + + The URL of the LDAP server + + + + The URL of the LDAP server to use for resolving user groups when using + the LdapGroupsMapping user to group mapping. + + + + + hadoop.security.group.mapping.ldap.ssl + true + false + Boolean + security + + Use SSL connecting to LDAP server + + + + Whether or not to use SSL when connecting to the LDAP server. + + + + + hadoop.security.group.mapping.ldap.ssl.keystore + true + + true + String + security + + File path to the SSL keystore + + + + File path to the SSL keystore that contains the SSL certificate required + by the LDAP server. + + + + + hadoop.security.group.mapping.ldap.ssl.keystore.password.file + true + + true + String + security + + File path containing the password of LDAP SSL keystore + + + + The path to a file containing the password of the LDAP SSL keystore. + IMPORTANT: This file should be readable only by the Unix user running + the daemons. + + + + + hadoop.security.group.mapping.ldap.bind.user + true + + true + String + security + + The user name to bind as when connecting to the LDAP server + + + + The distinguished name of the user to bind as when connecting to the LDAP + server. This may be left blank if the LDAP server supports anonymous binds. + + + + + hadoop.security.group.mapping.ldap.bind.password.file + true + + true + String + security + + The path to a file containing the password of the bind user + + + + The path to a file containing the password of the bind user. + IMPORTANT: This file should be readable only by the Unix user running + the daemons. + + + + + hadoop.security.group.mapping.ldap.base + true + + true + String + security + + The search base for the LDAP connection + + + + The search base for the LDAP connection. This is a distinguished name, + and will typically be the root of the LDAP directory. + + + + + hadoop.security.group.mapping.ldap.search.filter.user + true + (&(objectClass=user)(sAMAccountName={0})) + String + security + + An filter to use when searching for LDAP users + + + + An additional filter to use when searching for LDAP users. The default will + usually be appropriate for Active Directory installations. If connecting to + an LDAP server with a non-AD schema, this should be replaced with + (&(objectClass=inetOrgPerson)(uid={0}). {0} is a special string used to + denote where the username fits into the filter. + + + + + hadoop.security.group.mapping.ldap.search.filter.group + true + (objectClass=group) + String + security + + An filter to use when searching for LDAP groups + + + + An additional filter to use when searching for LDAP groups. This should be + changed when resolving groups against a non-Active Directory installation. + posixGroups are currently not a supported group class. + + + + + hadoop.security.group.mapping.ldap.search.attr.member + true + member + String + security + + The attribute identifying the users that are members of the group + + + + The attribute of the group object that identifies the users that are + members of the group. The default will usually be appropriate for + any LDAP installation. 
+ + + + + hadoop.security.group.mapping.ldap.search.attr.group.name + cn + String + security + + The attribute identifying the group name + + + + The attribute of the group object that identifies the group name. The + default will usually be appropriate for all LDAP systems. + + + + + basic + Hadoop Basic + true + false + + + ioconf + Hadoop IO + true + false + + + basic + Basic Configuration + Basic configurations that get Hadoop running. + + + perf + Performance + Configurations that affect Hadoop's performance + + + security + Security + Security configurations like Kerberos. + + + network + Network Setting + Network Setting. + + + filesystem + File System + File System configurations. + + + namenode + Namenode + Configurations for HDFS Namenode. + + + io + IO Configuration + IO Configuration + + + ipc + IPC + IPC Configuration + + + proxy + Proxy Configuration + Proxy Configuration + + + rack + Rack Configuration + Rack Configuration + +
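The hadoop-default.xml resource above enumerates core Hadoop parameters along with the type, category and description metadata that the plugin surfaces as cluster configs. As a minimal sketch of how such a defaults file can be read into plain config records (assuming the stock Hadoop <property>/<name>/<value>/<description> layout; the richer Intel fields such as type and category from configuration.xsd are deliberately not modeled, and load_hadoop_defaults is a name made up for this illustration, not the plugin's loader):

import xml.etree.ElementTree as ET


def load_hadoop_defaults(path):
    """Return a list of {'name', 'value', 'description'} dicts."""
    configs = []
    root = ET.parse(path).getroot()
    for prop in root.findall('property'):
        name = prop.findtext('name')
        if not name:
            # Skip malformed entries that have no property name.
            continue
        configs.append({
            'name': name,
            'value': prop.findtext('value', default=''),
            'description': (prop.findtext('description') or '').strip(),
        })
    return configs


if __name__ == '__main__':
    for cfg in load_hadoop_defaults('hadoop-default.xml'):
        print('%s = %s' % (cfg['name'], cfg['value']))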
diff --git a/savanna/plugins/intel/resources/hdfs-default.xml b/savanna/plugins/intel/resources/hdfs-default.xml new file mode 100644 index 00000000..e86aa73a --- /dev/null +++ b/savanna/plugins/intel/resources/hdfs-default.xml @@ -0,0 +1,1193 @@ + + + + + + + + hadoop.namenode.memory + 0 + Integer + 1 + true + true + namenode + + Namenode server memory size + + + Default size for namenode server memory. + + + + hadoop.secondary.namenode.memory + 0 + Integer + 1 + true + true + namenode + + Secondary namenode server memory size + + + Default size for secondary namenode server memory. + + + + hadoop.datanode.memory + 4096 + Integer + 1 + true + true + datanode + + Datanode server memory size + + + Default size for datanode server memory. + + + + dfs.namenode.logging.level + info + String + namenode + + Namenode logging level + + + The logging level for dfs namenode. Other values are "dir"(trac +e namespace mutations), "block"(trace block under/over replications and block +creations/deletions), or "all". + + + + dfs.secondary.http.address + 0.0.0.0:50090 + String + false + namenode + + Secondary namenode http server address and port + + + + The secondary namenode http server address and port. + If the port is 0 then the server will start on a free port. + + + + + dfs.datanode.address + 0.0.0.0:50010 + String + datanode + + Address datanode server listens to + + + + The address where the datanode server will listen to. + If the port is 0 then the server will start on a free port. + + + + + dfs.datanode.http.address + 0.0.0.0:50075 + String + datanode + + Datanode http server address and port + + + + The datanode http server address and port. + If the port is 0 then the server will start on a free port. + + + + + dfs.datanode.ipc.address + 0.0.0.0:50020 + String + datanode + + Datanode ipc server adderss and port + + + + The datanode ipc server address and port. + If the port is 0 then the server will start on a free port. + + + + + dfs.block.local-path-access.user + + hbase + String + datanode + + DFS short circuit read allowed user list + + + The user in this list can directly read the local file system HDFS block, + instead of reading through DataNode, thus improving performance, + The list is seperated by comma. + + true + + + dfs.datanode.handler.count + 3 + 3 + 100 + Integer + datanode + + Datanode server threads count + + + The number of server threads for the datanode. + + + + dfs.datanode.max.xcievers + 32768 + Integer + datanode + + Datanode service threads count + + + Number of threads for the datanode service. + + + + dfs.http.address + 0.0.0.0:50070 + String + false + basic + + Namenode Web UI address and port + + + + The address and the base port where the dfs namenode web ui will listen on. + If the port is 0 then the server will start on a free port. 
+ + + + + dfs.https.enable + false + Boolean + security + + Whether to support HTTPS + + + Decide if HTTPS(SSL) is supported on HDFS + + + + + dfs.https.need.client.auth + false + Boolean + security + + Whether require SSL client certificate authentication + + + Whether SSL client certificate authentication is required + + + + + dfs.https.server.keystore.resource + ssl-server.xml + String + security + + Resource file to extract SSL server keystore information + + + Resource file from which ssl server keystore + information will be extracted + + + + + dfs.https.client.keystore.resource + ssl-client.xml + String + security + + Resource file to extract SSL client keystore information + + + Resource file from which ssl client keystore + information will be extracted + + + + + dfs.datanode.https.address + 0.0.0.0:50475 + String + datanode + + Datanode https server address and port + + + + The datanode https server address and port. + If the port is 0 then the server will start on a free port. + + + + + dfs.https.address + 0.0.0.0:50470 + String + basic + + dfs https address and port + + + dfs https address and port + + + + dfs.datanode.dns.interface + default + String + datanode + + Network Interface name from which Datanode should report its IP address + + + The name of the Network Interface from which a data node should + report its IP address. + + + + + dfs.datanode.dns.nameserver + default + String + datanode + + Datanode name server address + + + The host name or IP address of the name server (DNS) + which a DataNode should use to determine the host name used by the + NameNode for communication and display purposes. + + + + + dfs.replication.considerLoad + true + Boolean + perf + + Whether chooseTarget considers the target's load or not + + + Decide if chooseTarget considers the target's load or not + + + + + dfs.default.chunk.view.size + 32768 + Integer + basic + + Chunk size to view on a browser + + + The number of bytes to view for a file on the browser. + + + + + dfs.datanode.du.reserved + 0 + Integer + datanode + + Reserved space in bytes per volume + + + Reserved space in bytes per volume. Always leave this much space free for non dfs use. + + + + + dfs.name.dir + /hadoop/drbd/hadoop_image,/hadoop/hadoop_image_local + Directory + basic + + DFS fsimage file directory + + + Determines where on the local filesystem the DFS name node + should store the name table(fsimage). If this is a comma-delimited list + of directories then the name table is replicated in all of the + directories, for redundancy. + + NameNode-system +
TextItem
+
+ + dfs.name.edits.dir + ${dfs.name.dir} + Directory + basic + + DFS edits file directory + + + Determines where on the local filesystem the DFS name node + should store the transaction (edits) file. If this is a comma-delimited list + of directories then the transaction file is replicated in all of the + directories, for redundancy. Default value is same as dfs.name.dir + + + + + dfs.web.ugi + webuser,webgroup + String + basic + + user account used by the web interface + + + The user account used by the web interface. + Syntax: USERNAME,GROUP1,GROUP2, ... + + + + + dfs.permissions + true + true + Boolean + security + + Whether enable permission checking in HDFS + + + + If "true", enable permission checking in HDFS. + If "false", permission checking is turned off, + but all other behavior is unchanged. + Switching from one parameter value to the other does not change the mode, + owner or group of files or directories. + + + + + dfs.permissions.extended + true + false + Boolean + security + + Whether to enable permission extension in HDFS + + + + If "true", enable permission extension in HDFS. + If "false", permission extension is turned off. + + + + + dfs.permissions.extended.permissions.file + true + + String + true + security + + Configuration file for extension rules + + + + If extended permissions is enabled, then the needed configuration file should be + configured here for extension rules. + + + + + dfs.permissions.supergroup + supergroup + String + security + + super-users group name + + + The name of the group of super-users. + + + + dfs.block.access.token.enable + false + Boolean + security + + Access tokens for accessing datanodes + + + + If "true", access tokens are used as capabilities for accessing datanodes. + If "false", no access tokens are checked on accessing datanodes. + + + + + dfs.block.access.key.update.interval + 600 + Integer + security + + Interval at which namenode updates its access keys + + + + Interval in minutes at which namenode updates its access keys. + + + + + dfs.block.access.token.lifetime + 600 + Integer + security + + Access tokens lifetime + + + The lifetime of access tokens in minutes. + + + + dfs.data.dir + ${hadoop.tmp.dir}/dfs/data + ${hadoop.tmp.dir}/dfs/data + + Directory + false + + basic + + Local filesystem directory datanode stores its blocks + + + Determines where on the local filesystem an DFS data node + should store its blocks. If this is a comma-delimited + list of directories, then data will be stored in all named + directories, typically on different devices. + Directories that do not exist are ignored. + + + 2 + + + dfs.datanode.data.dir.perm + 755 + 755 + 755 + Integer + security + + Local filesystem directory permissions + + + Permissions for the directories on on the local filesystem where + the DFS data node store its blocks. The permissions can either be octal or + symbolic. + + + + dfs.replication + 3 + Integer + basic + + Block replication count + + + Default block replication. + The actual number of replications can be specified when the file is created. + The default is used if replication is not specified in create time. + + + basic +
TextItem
+
+ + dfs.replication.max + 512 + Integer + basic + + Maximal block replication count + + + Maximal block replication. + + + + + dfs.replication.min + 1 + Integer + basic + + Minimal block replication count + + + Minimal block replication. + + + + + dfs.block.size + 67108864 + 67108864 + 134217728 + Integer + basic + + Default block size + + + The default block size for new files. + + basic +
TextItem
+
+ + dfs.df.interval + 60000 + Integer + basic + + Disk usage statistics refresh interval + + + Disk usage statistics refresh interval in msec. + + + + dfs.client.block.write.retries + 3 + Integer + perf + + Writing to datanodes retry times + + + The number of retries for writing blocks to the data nodes, + before we signal failure to the application. + + + + + dfs.blockreport.intervalMsec + 3600000 + Integer + basic + + Block reporting interval + + + Determines block reporting interval in milliseconds. + + + + dfs.blockreport.initialDelay + 0 + Integer + basic + + Delay for first block report + + + Delay for first block report in seconds. + + + + dfs.datanode.directoryscan.interval + 21600 + Integer + datanode + + Datanode scan data interval + + + Interval in seconds for Datanode to scan data directories and + reconcile the difference between blocks in memory and on the disk. + + + + + dfs.datanode.directoryscan.threads + 1 + Integer + datanode + + Number of threads to use when scanning volumes to + generate block reports + + + Number of threads to use when scanning volumes to + generate block reports. A value greater than one means + volumes will be scanned in parallel. + + + + dfs.heartbeat.interval + 3 + Integer + datanode + + Datanode heartbeat + + + Determines datanode heartbeat interval in seconds. + + + + dfs.namenode.handler.count + 10 + 10 + 100 + Integer + namenode + + Namenode server threads count + + + The number of server threads for the namenode. + + NameNode-system +
TextItem
+
+ + dfs.safemode.threshold.pct + 0.999f + Float + basic + + percentage of blocks that should satisfy + the minimal replication requirement defined by dfs.replication.min. + + + + + Specifies the percentage of blocks that should satisfy + the minimal replication requirement defined by dfs.replication.min. + Values less than or equal to 0 mean not to wait for any particular + percentage of blocks before exiting safemode. + Values greater than 1 will make safe mode permanent. + + + + + dfs.safemode.min.datanodes + 0 + Integer + true + basic + + number of datanodes that must be considered alive + before the name node exits safemode. + + + + Specifies the number of datanodes that must be considered alive + before the name node exits safemode. + Values less than or equal to 0 mean not to take the number of live + datanodes into account when deciding whether to remain in safe mode + during startup. + Values greater than the number of datanodes in the cluster + will make safe mode permanent. + + + + + dfs.safemode.extension + 30000 + Integer + basic + + Safe mode extension time + + + + Determines extension of safe mode in milliseconds + after the threshold level is reached. + + + + + dfs.balance.bandwidthPerSec + 1048576 + 1048576 + 104857600 + Integer + datanode + + Maximal amount of bandwidth that each datanode + can utilize for the balancing purpose + + + + Specifies the maximal amount of bandwidth that each datanode + can utilize for the balancing purpose in terms of + the number of bytes per second. + + + + + dfs.hosts + + String + true + basic + + File that contains a list of hosts + permitted to connect to the namenode + + + Names a file that contains a list of hosts that are + permitted to connect to the namenode. The full pathname of the file + must be specified. If the value is empty, all hosts are + permitted. + + + + dfs.hosts.exclude + + String + true + basic + + File that contains a list of hosts + not permitted to connect to the namenode + + + Names a file that contains a list of hosts that are + not permitted to connect to the namenode. The full pathname of the + file must be specified. If the value is empty, no hosts are + excluded. + + + + dfs.max.objects + 0 + Integer + basic + + The maximum number of files, directories and blocks + dfs supports + + + The maximum number of files, directories and blocks + dfs supports. A value of zero indicates no limit to the number + of objects that dfs supports. + + + + + dfs.namenode.decommission.interval + 30 + Integer + namenode + + Namenode periodicity to check if decommission is complete + + + Namenode periodicity in seconds to check if decommission is + complete. + + + + dfs.namenode.decommission.nodes.per.interval + 5 + Integer + namenode + + The number of nodes namenode checks if decommission is complete + + + The number of nodes namenode checks if decommission is complete + in each dfs.namenode.decommission.interval. + + + + dfs.replication.interval + 3 + Integer + basic + + The periodicity in seconds with which the namenode computes + repliaction work for datanodes. + + + The periodicity in seconds with which the namenode computes + repliaction work for datanodes. + + + + dfs.access.time.precision + 3600000 + Integer + basic + + HDFS file access time precision + + + The access time for HDFS file is precise upto this value. + The default value is 1 hour. Setting a value of 0 disables + access times for HDFS. + + + + + dfs.support.append + true + Boolean + basic + + Whether HDFS allows appends + + + Does HDFS allow appends to files? 
+ + + + dfs.datanode.plugins + + String + true + datanode + + Datanode plugins to be activated + + + Comma-separated list of datanode plug-ins to be activated. + + + + + dfs.namenode.plugins + + String + true + namenode + + Namenode plugins to be activated + + + Comma-separated list of namenode plug-ins to be activated. + + + + + dfs.datanode.failed.volumes.tolerated + 0 + Integer + datanode + + The number of volumes that are allowed to + fail before a datanode stops offering service + + + The number of volumes that are allowed to + fail before a datanode stops offering service. By default + any volume failure will cause a datanode to shutdown. + + + + + dfs.namenode.delegation.key.update-interval + 86400000 + Integer + namenode + + Namenode delegation key update interval + + + The update interval for master key for delegation tokens + in the namenode in milliseconds. + + + + + dfs.namenode.delegation.token.max-lifetime + 604800000 + Integer + namenode + + Namenode delegation key maximum lifetime + + + The maximum lifetime in milliseconds for which a delegation + token is valid. + + + + + dfs.namenode.delegation.token.renew-interval + 86400000 + Integer + namenode + + Namenode delegation key renewal interval + + + The renewal interval for delegation token in milliseconds. + + + + + dfs.drbd.name.dir + /hadoop/drbd + Directory + true + true + basic + + Remote backup directory + + + Setting remote backup directory, this directory must be set in "dfs.name.dir". + + NameNode-system +
TextItem
+
+ + hdfs.shortcut.reader.user + + String + true + true + datanode + + User when reading local data in datanode + + + The user to use when reading local data directly in the datanode. + An empty value disables the feature. + + + + namenode.memory.weight + + 50 + Integer + true + namenode + + Weight of namenode heapsize + + + The weight of the namenode heap size; the default value is 50. + + advanced +
TextItem
+
+ + secondary.namenode.memory.weight + + 50 + Integer + true + namenode + + Weight of secondary namenode heapsize + + + The weight of the secondary namenode heap size; the default value is 50. + + + + + dfs.socket.timeout + 120000 + Integer + basic + + Timeout for socket connection + + + Timeout for socket connection. + + + + dfs.replication.adjust + false + Boolean + replication + + Whether to adjust the replication count + + + + If true, adjust the number of replicas according to how often blocks are visited. + + + + + dfs.replication.historyWindow + 1440 + Integer + replication + + Retention cycle time + + + + Determines the retention cycle of file visit statistics (in minutes). The default value is 1 day. + + + + + dfs.replication.adjustTimer + 720 + Integer + replication + + Replication adjusting interval + + + + Determines the file replication adjusting interval (in minutes). The default value is 6 hours. + + + + + dfs.replication.adjust.maxPercent + 0.1 + Float + replication + + Replica adjusting max percentage of disk space + + + + The maximum percentage of disk space that replica adjusting may use. + + + + + dfs.replication.reserved.datanode.number.percent + 0.1 + Float + replication + + Percentage of datanodes reserved for others + + + + The percentage of datanodes reserved for other use. + + + + + dfs.replication.adjust.blockWeight + 10 + Integer + replication + + Number of blocks used as a unit for weight adjustment + + + + The number of blocks regarded as a basic unit when adjusting weight. + + + + + + basic + HDFS Basic + true + false + + + NameNode-system + NameNode Configuration + true + false + "" + + + advanced + Advanced Configuration + true + false + "" + + + basic + Basic Configuration + Basic configurations that get HDFS running. + + + perf + Performance + Configurations that affect Hadoop's performance. + + + namenode + Namenode Configuration + Configurations for Namenode. + + + datanode + Datanode Configuration + Configurations for Datanode. + + + security + Security + Security configurations like permission control. + + + replication + Replication + Configurations for replication. + +
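The hdfs-default.xml resource ends here; in practice only the values a user overrides in the cluster configs (for example dfs.replication or dfs.block.size, whose defaults appear above) need to be rendered into hdfs-site.xml on the instances. A hypothetical illustration of that merge-and-render step, not the plugin's actual code path; generate_site_xml and the sample dicts exist only for this sketch:

from xml.sax.saxutils import escape


def generate_site_xml(defaults, user_configs):
    """Render only the overridden properties, Hadoop *-site.xml style."""
    merged = dict(defaults)
    merged.update(user_configs)
    lines = ['<?xml version="1.0"?>', '<configuration>']
    for name in sorted(user_configs):
        lines.append('  <property>')
        lines.append('    <name>%s</name>' % escape(name))
        lines.append('    <value>%s</value>' % escape(str(merged[name])))
        lines.append('  </property>')
    lines.append('</configuration>')
    return '\n'.join(lines)


if __name__ == '__main__':
    defaults = {'dfs.replication': '3', 'dfs.block.size': '67108864'}
    overrides = {'dfs.replication': '2'}
    print(generate_site_xml(defaults, overrides))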
diff --git a/savanna/plugins/intel/resources/mapred-default.xml b/savanna/plugins/intel/resources/mapred-default.xml new file mode 100644 index 00000000..107f962a --- /dev/null +++ b/savanna/plugins/intel/resources/mapred-default.xml @@ -0,0 +1,2678 @@ + + + + + + + + hadoop.jobtracker.memory + 4096 + Integer + jobtracker + + JobTracker server memory size + + 1 + true + true + + Default size for jobtracker server memory. + + + + hadoop.tasktracker.slot.memory + 4096 + Integer + tasktracker + + Total memory size for tasktracker map and reduce slot + + 1 + true + true + + Total memory size for tasktracker map and reduce slot. + + + + hadoop.tasktracker.memory + 4096 + Integer + tasktracker + + Default size for tasktracker server memory + + 1 + true + true + + Default size for tasktracker server memory. + + + + hadoop.job.history.location + + true + String + basic + + job history location + + + If job tracker is static the history files are stored + in this single well known place. If No value is set here, by default, + it is in the local file system at ${hadoop.log.dir}/history. + + + + + hadoop.job.history.user.location + + true + String + basic + + user specified history location + + + User can specify a location to store the history files of + a particular job. If nothing is specified, the logs are stored in + output directory. The files are stored in "_logs/history/" in the directory. + User can stop logging by giving the value "none". + + + + + mapred.job.tracker.history.completed.location + + true + String + basic + + The completed job history files location + + + The completed job history files are stored at this single well + known location. If nothing is specified, the files are stored at + ${hadoop.job.history.location}/done. + + + + + + io.sort.factor + 10 + 10 + 100 + Integer + perf + + IO sort factor + + + The number of streams to merge at once while sorting + files. This determines the number of open file handles. + + + + io.sort.mb + 100 + 100 + 200 + Integer + perf + + Total amount of buffer memory to use while sorting + files, + + + The total amount of buffer memory to use while sorting + files, in megabytes. By default, gives each merge stream 1MB, which + should minimize seeks. + + + + io.sort.record.percent + 0.05 + Float + perf + + The percentage of io.sort.mb dedicated to tracking record + boundaries + + + The percentage of io.sort.mb dedicated to tracking record + boundaries. Let this value be r, io.sort.mb be x. The maximum number + of records collected before the collection thread must block is equal + to (r * x) / 4 + + + + io.sort.spill.percent + 0.80 + Float + perf + + buffer limit + + + + The soft limit in either the buffer or record collection + buffers. Once reached, a thread will begin to spill the contents to disk + in the background. Note that this does not imply any chunking of data to + the spill. A value less than 0.5 is not recommended. + + + + io.map.index.skip + 0 + Integer + io + + Number of index entries to skip between each entry + + + Number of index entries to skip between each entry. + Zero by default. Setting this to values larger than zero can + facilitate opening large map files using less memory. + + + + mapred.job.tracker + false + local + + true + String + jobtracker + + The host and port that the MapReduce job tracker runs + at + + + The host that the MapReduce job tracker runs + at. If "local", then jobs are run in-process as a single map + and reduce task. 
+ + + + + mapred.jobtracker + true + + true + String + true + jobtracker + + The address that the job tracker runs at + + directory + + The host and port that the MapReduce job tracker runs + at. If "local", then jobs are run in-process as a single map + and reduce task. + + +
TextItem
+
+ + mapred.jobtracker.port + 54311 + Integer + jobtracker + + The port that the MapReduce job tracker runs + at + + true + + The port that the MapReduce job tracker runs + at. If "local", then jobs are run in-process as a single map + and reduce task. + + + + + hadoop.jobtracker.thrift.port + 9290 + Integer + jobtracker + + The port for jobtracker thrift server. + + true + + The port for jobtracker thrift server. + + + + mapred.job.tracker.http.address + 0.0.0.0:50030 + String + jobtracker + + The job tracker http server address and port + + + + The job tracker http server address and port the server will listen on. + If the port is 0 then the server will start on a free port. + + + + + mapred.job.tracker.handler.count + 10 + 10 + 60 + Integer + jobtracker + + The number of server threads for the JobTracker. + + + + The number of server threads for the JobTracker. This should be roughly + 4% of the number of tasktracker nodes. + + + + + mapred.task.tracker.report.address + 127.0.0.1:0 + String + tasktracker + + The interface and port that task tracker server listens on + + + The interface and port that task tracker server listens on. + Since it is only connected to by the tasks, it uses the local interface. + EXPERT ONLY. Should only be changed if your host does not have the loopback + interface. + + + + mapred.local.dir + ${hadoop.tmp.dir}/mapred/local + + true + Directory + basic + + MapReduce local directory + + + 2 + + The local directory where MapReduce stores intermediate + data files. May be a comma-separated list of + directories on different devices in order to spread disk i/o. + Directories that do not exist are ignored. + + + + + mapred.system.dir + ${hadoop.tmp.dir}/mapred/system + Directory + basic + + The directory where MapReduce stores control files. + + false + + The directory where MapReduce stores control files. + + + + mapreduce.jobtracker.staging.root.dir + ${hadoop.tmp.dir}/mapred/staging + Directory + basic + + The root of the staging area for users' job files + + false + + The root of the staging area for users' job files + In practice, this should be the directory where users' home + directories are located (usually /user) + + + + + mapred.temp.dir + ${hadoop.tmp.dir}/mapred/temp + Directory + basic + + A shared directory for temporary files. + + false + + A shared directory for temporary files. + + + + mapred.local.dir.minspacestart + 0 + Integer + basic + + minimum space in mapred.local.dir to start task + + + If the space in mapred.local.dir drops under this, + do not ask for more tasks. Value in bytes. + + + + mapred.local.dir.minspacekill + 0 + Integer + basic + + mapred.local.dir minimum space kill + + + If the space in mapred.local.dir drops under this, + do not ask more tasks until all the current ones have finished and + cleaned up. Also, to save the rest of the tasks we have running, + kill one of them, to clean up some space. Start with the reduce tasks, + then go with the ones that have finished the least. + Value in bytes. + + + + + mapred.tasktracker.expiry.interval + 600000 + 600000 + 180000 + Integer + tasktracker + + TaskTracker expiry interval + + + Expert: The time-interval, in miliseconds, after which + a tasktracker is declared 'lost' if it doesn't send heartbeats. + + + + + mapred.tasktracker.instrumentation + false + org.apache.hadoop.mapred.TaskTrackerMetricsSource + Class + tasktracker + + TaskTracker instrumentation class + + + Expert: The instrumentation class to associate with each TaskTracker. 
+ + + + + mapred.tasktracker.resourcecalculatorplugin + + true + String + tasktracker + + tasktracker resource calculator plugin + + + + Name of the class whose instance will be used to query resource information + on the tasktracker.The class must be an instance of + org.apache.hadoop.util.ResourceCalculatorPlugin. If the value is null, the + tasktracker attempts to use a class appropriate to the platform. + Currently, the only platform supported is Linux. + + + + + mapred.tasktracker.taskmemorymanager.monitoring-interval + 5000 + Integer + tasktracker + + TaskTracker monitoring interval + + + The interval, in milliseconds, for which the tasktracker waits + between two cycles of monitoring its tasks' memory usage. Used only if + tasks' memory management is enabled via mapred.tasktracker.tasks.maxmemory. + + + + + mapred.tasktracker.tasks.sleeptime-before-sigkill + 5000 + Integer + tasktracker + + TaskTracker sleeptime before sending a SIGKILL + + + The time, in milliseconds, the tasktracker waits for sending a + SIGKILL to a process, after it has been sent a SIGTERM. + + + + mapred.map.tasks + 2 + Integer + map + + map count + + + The default number of map tasks per job. + Ignored when mapred.job.tracker is "local". + + + + + mapred.reduce.tasks + 1 + Integer + reduce + + reduce count + + + + The default number of reduce tasks per job. Typically set to 99% + of the cluster's reduce capacity, so that if a node fails the reduces can + still be executed in a single wave. + Ignored when mapred.job.tracker is "local". + + + + + mapreduce.tasktracker.outofband.heartbeat + false + true + Boolean + tasktracker + + TaskTracker out-of-band heartbeat + + + Expert: Set this to true to let the tasktracker send an + out-of-band heartbeat on task-completion for better latency. + + + + + mapreduce.tasktracker.outofband.heartbeat.damper + 1000000 + Integer + tasktracker + + out-of-band heartbeat damper + + + When out-of-band heartbeats are enabled, provides + damping to avoid overwhelming the JobTracker if too many out-of-band + heartbeats would occur. The damping is calculated such that the + heartbeat interval is divided by (T*D + 1) where T is the number + of completed tasks and D is the damper value. + Setting this to a high value like the default provides no damping -- + as soon as any task finishes, a heartbeat will be sent. Setting this + parameter to 0 is equivalent to disabling the out-of-band heartbeat feature. + A value of 1 would indicate that, after one task has completed, the + time to wait before the next heartbeat would be 1/2 the usual time. + After two tasks have finished, it would be 1/3 the usual time, etc. + + + + + mapred.jobtracker.restart.recover + false + Boolean + job + + Whether enable job recovery + + + "true" to enable (job) recovery upon restart, + "false" to start afresh + + + + + mapred.jobtracker.job.history.block.size + 3145728 + Integer + job + + The block size of the job history file + + + The block size of the job history file. Since the job recovery + uses job history, its important to dump job history to disk as + soon as possible. Note that this is an expert level parameter. + The default value is set to 3 MB. + + + + + mapreduce.job.split.metainfo.maxsize + 10000000 + Integer + job + + The maximum permissible size of the split metainfo file + + + The maximum permissible size of the split metainfo file. + The JobTracker won't attempt to read split metainfo files bigger than + the configured value. + No limits if set to -1. 
+ + + + + mapred.jobtracker.taskScheduler + false + org.apache.hadoop.mapred.JobQueueTaskScheduler + Class + basic + + The class responsible for scheduling the tasks. + + + The class responsible for scheduling the tasks. + + + + mapred.jobtracker.taskScheduler.maxRunningTasksPerJob + + true + Integer + job + + The maximum number of running tasks for a job before + it gets preempted + + false + + The maximum number of running tasks for a job before + it gets preempted. No limits if undefined. + + + + + mapred.map.max.attempts + 4 + Integer + map + + Map maximum attempt times + + + Expert: The maximum number of attempts per map task. + In other words, framework will try to execute a map task these many number + of times before giving up on it. + + + + + mapred.reduce.max.attempts + 4 + Integer + reduce + + Reduce maximum attempt times + + + Expert: The maximum number of attempts per reduce task. + In other words, framework will try to execute a reduce task these many number + of times before giving up on it. + + + + + mapred.reduce.parallel.copies + 5 + 20 + Integer + perf + + The default number of parallel transfers run by reduce + during the copy(shuffle) phase + + + The default number of parallel transfers run by reduce + during the copy(shuffle) phase. + + + + + mapreduce.reduce.shuffle.maxfetchfailures + 10 + Integer + reduce + + reducer maximum fetch failures + + + The maximum number of times a reducer tries to + fetch a map output before it reports it. + + + + + mapreduce.reduce.shuffle.connect.timeout + 180000 + Integer + reduce + + reducer connect timeout + + + Expert: The maximum amount of time (in milli seconds) a reduce + task spends in trying to connect to a tasktracker for getting map output. + + + + + mapreduce.reduce.shuffle.read.timeout + 180000 + Integer + reduce + + reducer read timeout + + + Expert: The maximum amount of time (in milli seconds) a reduce + task waits for map output data to be available for reading after obtaining + connection. + + + + + mapred.task.timeout + 600000 + 180000 + Integer + basic + + task timeout value + + + The number of milliseconds before a task will be + terminated if it neither reads an input, writes an output, nor + updates its status string. + + + + + mapred.tasktracker.map.tasks.maximum + 2 + + true + Integer + tasktracker + + The maximum number of map tasks that will be run + simultaneously by a task tracker + + true + + 2 + + The maximum number of map tasks that will be run + simultaneously by a task tracker. + + + + + mapred.tasktracker.reduce.tasks.maximum + 2 + + true + Integer + tasktracker + + The maximum number of reduce tasks that will be run + simultaneously by a task tracker. + + true + + 2 + + The maximum number of reduce tasks that will be run + simultaneously by a task tracker. + + + + + mapred.jobtracker.completeuserjobs.maximum + 100 + Integer + job + + maximum number of complete jobs to keep around per user + + + The maximum number of complete jobs per user to keep around + before delegating them to the job history. + + + + mapreduce.reduce.input.limit + -1 + Integer + reduce + + The limit on the input size of the reduce + + + The limit on the input size of the reduce. If the estimated + input size of the reduce is greater than this value, job is failed. A + value of -1 means that there is no limit set. + + + + mapred.job.tracker.retiredjobs.cache.size + 1000 + Integer + job + + The number of retired job status to keep in the cache. + + + The number of retired job status to keep in the cache. 
+ + + + mapred.job.tracker.jobhistory.lru.cache.size + 5 + Integer + job + + The number of job history files loaded in memory + + + The number of job history files loaded in memory. The jobs are + loaded when they are first accessed. The cache is cleared based on LRU. + + + + + mapred.jobtracker.instrumentation + false + org.apache.hadoop.mapred.JobTrackerMetricsSource + Class + jobtracker + + JobTracker instrumentation class + + + Expert: The instrumentation class to associate with each JobTracker. + + + + mapred.child.java.opts + -Xmx200m + -Xmx512m -XX:+UseConcMarkSweepGC -XX:ParallelCMSThreads=1 -XX:ParallelGCThreads=1 + true + String + tasktracker + + Java opts for the task tracker child processes + + + Java opts for the task tracker child processes. + The following symbol, if present, will be interpolated: @taskid@ is replaced + by current TaskID. Any other occurrences of '@' will go unchanged. + For example, to enable verbose gc logging to a file named for the taskid in + /tmp and to set the heap maximum to be a gigabyte, pass a 'value' of: + -Xmx1024m -verbose:gc -Xloggc:/tmp/@taskid@.gc + The configuration variable mapred.child.ulimit can be used to control the + maximum virtual memory of the child processes. + + + + + mapred.child.heapsize + 200 + Integer + basic + + The JVM heapsize used by each map task and reduce task. + + true + true + + The JVM heapsize used by each map task and reduce task. + + + + mapred.child.env + + true + Integer + tasktracker + + tasktracker child process environment variable + + + User added environment variables for the task tracker child + processes. Example : + 1) A=foo This will set the env variable A to foo + 2) B=$B:c This is inherit tasktracker's B env variable. + + + + + mapred.child.ulimit + + true + + String + basic + + MapReduce maximum virtual memory + + + The maximum virtual memory, in KB, of a process launched by the + Map-Reduce framework. This can be used to control both the Mapper/Reducer + tasks and applications using Hadoop Pipes, Hadoop Streaming etc. + By default it is left unspecified to let cluster admins control it via + limits.conf and other such relevant mechanisms. + Note: mapred.child.ulimit must be greater than or equal to the -Xmx passed to + JavaVM, else the VM might not start. + + + + + mapred.cluster.map.memory.mb + -1 + Integer + map + + map virtual memory size + + + The size, in terms of virtual memory, of a single map slot + in the Map-Reduce framework, used by the scheduler. + A job can ask for multiple slots for a single map task via + mapred.job.map.memory.mb, upto the limit specified by + mapred.cluster.max.map.memory.mb, if the scheduler supports the feature. + The value of -1 indicates that this feature is turned off. + + + + + mapred.cluster.reduce.memory.mb + -1 + Integer + reduce + + reduce virtual memory size + + + The size, in terms of virtual memory, of a single reduce slot + in the Map-Reduce framework, used by the scheduler. + A job can ask for multiple slots for a single reduce task via + mapred.job.reduce.memory.mb, upto the limit specified by + mapred.cluster.max.reduce.memory.mb, if the scheduler supports the feature. + The value of -1 indicates that this feature is turned off. + + + + + mapred.cluster.max.map.memory.mb + -1 + Integer + map + + map maximum virtual memory size + + + The maximum size, in terms of virtual memory, of a single map + task launched by the Map-Reduce framework, used by the scheduler. 
+ A job can ask for multiple slots for a single map task via + mapred.job.map.memory.mb, upto the limit specified by + mapred.cluster.max.map.memory.mb, if the scheduler supports the feature. + The value of -1 indicates that this feature is turned off. + + + + + mapred.cluster.max.reduce.memory.mb + -1 + Integer + reduce + + reduce maximum virtual memory size + + + The maximum size, in terms of virtual memory, of a single reduce + task launched by the Map-Reduce framework, used by the scheduler. + A job can ask for multiple slots for a single reduce task via + mapred.job.reduce.memory.mb, upto the limit specified by + mapred.cluster.max.reduce.memory.mb, if the scheduler supports the feature. + The value of -1 indicates that this feature is turned off. + + + + + mapred.job.map.memory.mb + -1 + Integer + map + + map virtual memory size + + + The size, in terms of virtual memory, of a single map task + for the job. + A job can ask for multiple slots for a single map task, rounded up to the + next multiple of mapred.cluster.map.memory.mb and upto the limit + specified by mapred.cluster.max.map.memory.mb, if the scheduler supports + the feature. + The value of -1 indicates that this feature is turned off iff + mapred.cluster.map.memory.mb is also turned off (-1). + + + + + mapred.job.reduce.memory.mb + -1 + Integer + reduce + + reduce virtual memory size + + + The size, in terms of virtual memory, of a single reduce task + for the job. + A job can ask for multiple slots for a single map task, rounded up to the + next multiple of mapred.cluster.reduce.memory.mb and upto the limit + specified by mapred.cluster.max.reduce.memory.mb, if the scheduler supports + the feature. + The value of -1 indicates that this feature is turned off iff + mapred.cluster.reduce.memory.mb is also turned off (-1). + + + + + mapred.child.tmp + ./tmp + String + basic + + tmp directory for map and reduce tasks + + + To set the value of tmp directory for map and reduce tasks. + If the value is an absolute path, it is directly assigned. Otherwise, it is + prepended with task's working directory. The java tasks are executed with + option -Djava.io.tmpdir='the absolute path of the tmp dir'. Pipes and + streaming are set with environment variable, + TMPDIR='the absolute path of the tmp dir' + + + + + mapred.inmem.merge.threshold + 1000 + Integer + perf + + in-memory merge threshold + + + The threshold, in terms of the number of files + for the in-memory merge process. When we accumulate threshold number of files + we initiate the in-memory merge and spill to disk. A value of 0 or less than + 0 indicates we want to DON'T have any threshold and instead depend only on + the ramfs's memory consumption to trigger the merge. + + + + + mapred.job.shuffle.merge.percent + 0.66 + Float + perf + + The usage threshold at which an in-memory merge will be + initiated + + + The usage threshold at which an in-memory merge will be + initiated, expressed as a percentage of the total memory allocated to + storing in-memory map outputs, as defined by + mapred.job.shuffle.input.buffer.percent. + + + + + mapred.job.shuffle.input.buffer.percent + 0.70 + Float + perf + + memory to store map outputs during the shuffle + + + The percentage of memory to be allocated from the maximum heap + size to storing map outputs during the shuffle. 
+ + + + + mapred.job.reduce.input.buffer.percent + 0.0 + Float + perf + + The percentage of memory- relative to the maximum heap size- to + retain map outputs during the reduce + + + The percentage of memory- relative to the maximum heap size- to + retain map outputs during the reduce. When the shuffle is concluded, any + remaining map outputs in memory must consume less than this threshold before + the reduce can begin. + + + + + mapred.map.tasks.speculative.execution + true + true + Boolean + map + + whether to execute multiple instances of map task in parallel + + + If true, then multiple instances of some map tasks + may be executed in parallel. + + + + mapred.reduce.tasks.speculative.execution + true + true + false + Boolean + reduce + + whether to execute multiple instances of reduce task in parallel + + + If true, then multiple instances of some reduce tasks + may be executed in parallel. + + + + mapred.job.reuse.jvm.num.tasks + 1 + Integer + perf + + Number of taks to run per jvm + + + How many tasks to run per jvm. If set to -1, there is + no limit. + + + + + mapred.min.split.size + 0 + Integer + map + + The minimum size chunk that map input should be split + into + + + The minimum size chunk that map input should be split + into. Note that some file formats may have minimum split sizes that + take priority over this setting. + + + + mapred.jobtracker.maxtasks.per.job + -1 + Integer + job + + The maximum number of tasks for a single job + + + The maximum number of tasks for a single job. + A value of -1 indicates that there is no maximum. + + + + mapred.submit.replication + 10 + Integer + job + + The replication level for submitted job files + + + The replication level for submitted job files. This + should be around the square root of the number of nodes. + + + + + mapred.tasktracker.dns.interface + default + String + tasktracker + + The name of the Network Interface from which a task + tracker should report its IP address + + + The name of the Network Interface from which a task + tracker should report its IP address. + + + + + mapred.tasktracker.dns.nameserver + default + String + tasktracker + + TaskTracker name server address + + + The host name or IP address of the name server (DNS) + which a TaskTracker should use to determine the host name used by + the JobTracker for communication and display purposes. + + + + + tasktracker.http.threads + 40 + 40 + 60 + Integer + perf + + The number of worker threads that for the http server + + + The number of worker threads that for the http server. This is + used for map output fetching + + + + + mapred.task.tracker.http.address + 0.0.0.0:50060 + String + tasktracker + + The task tracker http server address and port + + + + The task tracker http server address and port. + If the port is 0 then the server will start on a free port. + + + + + keep.failed.task.files + false + Boolean + basic + + Whether to keep files for failed tasks + + + Should the files for failed tasks be kept. This should only be + used on jobs that are failing, because the storage is never + reclaimed. It also prevents the map outputs from being erased + from the reduce directory as they are consumed. + + + + + mapred.output.compress + false + Boolean + job + + Whether to compress job output + + + Should the job outputs be compressed? + + + + + mapred.output.compression.type + RECORD + RECORD + BLOCK + String + job + + compress type of job outputs + + + If the job outputs are to compressed as SequenceFiles, how should + they be compressed? 
Should be one of NONE, RECORD or BLOCK. + + + + + mapred.output.compression.codec + org.apache.hadoop.io.compress.DefaultCodec + Class + job + + job outputs compress codec class + + + If the job outputs are compressed, how should they be compressed? + + + + + mapred.compress.map.output + false + false + true + Boolean + map + + Whether to compress map outputs + + + Should the outputs of the maps be compressed before being + sent across the network. Uses SequenceFile compression. + + + + + mapred.map.output.compression.codec + org.apache.hadoop.io.compress.DefaultCodec + org.apache.hadoop.io.compress.DefaultCodec + org.apache.hadoop.io.compress.SnappyCodec + Class + map + + map outputs compression class + + + If the map outputs are compressed, how should they be + compressed? + + + + + map.sort.class + org.apache.hadoop.util.QuickSort + Class + basic + + The default sort class for sorting keys. + + + The default sort class for sorting keys. + + + + mapred.userlog.limit.kb + 0 + Integer + user + + The maximum size of user-logs of each task in KB + + + The maximum size of user-logs of each task in KB. 0 disables the cap. + + + + + mapred.userlog.retain.hours + 24 + Integer + user + + user log maximum retain hours + + + The maximum time, in hours, for which the user-logs are to be + retained after the job completion. + + + + mapred.user.jobconf.limit + 5242880 + Integer + user + + The maximum allowed size of the user jobconf + + + The maximum allowed size of the user jobconf. The + default is set to 5 MB + + + + mapred.hosts + + true + Integer + jobtracker + + Names a file that contains the list of nodes that may + connect to the jobtracker. + + + Names a file that contains the list of nodes that may + connect to the jobtracker. If the value is empty, all hosts are + permitted. + + + + mapred.hosts.exclude + + true + String + jobtracker + + Names a file that contains the list of hosts that + should be excluded by the jobtracker + + + Names a file that contains the list of hosts that + should be excluded by the jobtracker. If the value is empty, no + hosts are excluded. + + + + mapred.heartbeats.in.second + 100 + Integer + jobtracker + + Approximate number of heart-beats that could arrive + at JobTracker in a second + + + Expert: Approximate number of heart-beats that could arrive + at JobTracker in a second. Assuming each RPC can be processed + in 10msec, the default value is made 100 RPCs in a second. + + + + + mapred.max.tracker.blacklists + 4 + Integer + tasktracker + + TaskTracker maximum number of blacklists + + + The number of blacklists for a tasktracker by various jobs + after which the tasktracker will be marked as potentially + faulty and is a candidate for graylisting across all jobs. + (Unlike blacklisting, this is advisory; the tracker remains + active. However, it is reported as graylisted in the web UI, + with the expectation that chronically graylisted trackers + will be manually decommissioned.) This value is tied to + mapred.jobtracker.blacklist.fault-timeout-window; faults + older than the window width are forgiven, so the tracker + will recover from transient problems. It will also become + healthy after a restart. + + + + + mapred.jobtracker.blacklist.fault-timeout-window + 180 + Integer + tasktracker + + The timeout (in minutes) after which per-job tasktracker + faults are forgiven + + + The timeout (in minutes) after which per-job tasktracker + faults are forgiven. 
The window is logically a circular + buffer of time-interval buckets whose width is defined by + mapred.jobtracker.blacklist.fault-bucket-width; when the + "now" pointer moves across a bucket boundary, the previous + contents (faults) of the new bucket are cleared. In other + words, the timeout's granularity is determined by the bucket + width. + + + + + mapred.jobtracker.blacklist.fault-bucket-width + 15 + Integer + tasktracker + + TaskTracker fault timeout window bucket width + + + The width (in minutes) of each bucket in the tasktracker + fault timeout window. Each bucket is reused in a circular + manner after a full timeout-window interval (defined by + mapred.jobtracker.blacklist.fault-timeout-window). + + + + + mapred.max.tracker.failures + 4 + Integer + tasktracker + + TaskTracker maximum failures + + + The number of task-failures on a tasktracker of a given job + after which new tasks of that job aren't assigned to it. + + + + + jobclient.output.filter + FAILED + String + user + + he filter for controlling the output of the task's userlogs sent + to the console of the JobClient + + + The filter for controlling the output of the task's userlogs sent + to the console of the JobClient. + The permissible options are: NONE, KILLED, FAILED, SUCCEEDED and + ALL. + + + + + jobclient.completion.poll.interval + 5000 + Integer + user + + JobClient polling JobTracker interval + + + The interval (in milliseconds) between which the JobClient + polls the JobTracker for updates about job status. You may want to set this + to a lower value to make tests run faster on a single node system. Adjusting + this value in production may lead to unwanted client-server traffic. + + + + + jobclient.progress.monitor.poll.interval + 1000 + Integer + user + + The interval (in milliseconds) between which the JobClient + reports status to the console and checks for job completion + + + The interval (in milliseconds) between which the JobClient + reports status to the console and checks for job completion. You may want to set this + to a lower value to make tests run faster on a single node system. Adjusting + this value in production may lead to unwanted client-server traffic. + + + + + mapred.job.tracker.persist.jobstatus.active + false + Boolean + job + + Indicates if persistency of job status information is + active or not. + + + Indicates if persistency of job status information is + active or not. + + + + + mapred.job.tracker.persist.jobstatus.hours + 0 + Integer + job + + he number of hours job status information is persisted in DFS. + + + The number of hours job status information is persisted in DFS. + The job status information will be available after it drops of the memory + queue and between jobtracker restarts. With a zero value the job status + information is not persisted at all in DFS. + + + + + mapred.job.tracker.persist.jobstatus.dir + /jobtracker/jobsInfo + Directory + job + + The directory where the job status information is persisted + + + The directory where the job status information is persisted + in a file system to be available after it drops of the memory queue and + between jobtracker restarts. 
+ + + + + mapreduce.job.complete.cancel.delegation.tokens + true + Boolean + job + + Whether to unregister delegation tokens from renewal + + + if false - do not unregister/cancel delegation tokens + from renewal, because same tokens may be used by spawned jobs + + + + + mapred.task.profile + false + Boolean + basic + + Whether to collect profiler information + + + To set whether the system should collect profiler + information for some of the tasks in this job? The information is stored + in the user log directory. The value is "true" if task profiling + is enabled. + + + + mapred.task.profile.maps + 0-2 + Int_range + map + + ranges of map tasks to profile + + + To set the ranges of map tasks to profile. + mapred.task.profile has to be set to true for the value to be accounted. + + + + + mapred.task.profile.reduces + 0-2 + Int_range + reduce + + ranges of reduce tasks to profile + + + To set the ranges of reduce tasks to profile. + mapred.task.profile has to be set to true for the value to be accounted. + + + + + mapred.line.input.format.linespermap + 1 + Integer + basic + + Number of lines per split in NLineInputFormat + + + Number of lines per split in NLineInputFormat. + + + + + mapred.skip.attempts.to.start.skipping + 2 + Integer + skip + + he number of Task attempts AFTER which skip mode + will be kicked off + + + The number of Task attempts AFTER which skip mode + will be kicked off. When skip mode is kicked off, the + tasks reports the range of records which it will process + next, to the TaskTracker. So that on failures, TT knows which + ones are possibly the bad records. On further executions, + those are skipped. + + + + + mapred.skip.map.auto.incr.proc.count + true + Boolean + skip + + Whether to increment SkipBadRecords.COUNTER_MAP_PROCESSED_GROUPS + + + The flag which if set to true, + SkipBadRecords.COUNTER_MAP_PROCESSED_RECORDS is incremented + by MapRunner after invoking the map function. This value must be set to + false for applications which process the records asynchronously + or buffer the input records. For example streaming. + In such cases applications should increment this counter on their own. + + + + + mapred.skip.reduce.auto.incr.proc.count + true + Boolean + skip + + Whether to increment SkipBadRecords.COUNTER_REDUCE_PROCESSED_GROUPS + + + The flag which if set to true, + SkipBadRecords.COUNTER_REDUCE_PROCESSED_GROUPS is incremented + by framework after invoking the reduce function. This value must be set to + false for applications which process the records asynchronously + or buffer the input records. For example streaming. + In such cases applications should increment this counter on their own. + + + + + mapred.skip.out.dir + + true + String + skip + + skipped records output directory + + + If no value is specified here, the skipped records are + written to the output directory at _logs/skip. + User can stop writing skipped records by giving the value "none". + + + + + mapred.skip.map.max.skip.records + 0 + Integer + skip + + The number of acceptable skip records surrounding the bad + record PER bad record in mapper + + + The number of acceptable skip records surrounding the bad + record PER bad record in mapper. The number includes the bad record as well. + To turn the feature of detection/skipping of bad records off, set the + value to 0. + The framework tries to narrow down the skipped range by retrying + until this threshold is met OR all attempts get exhausted for this task. 
+ Set the value to Long.MAX_VALUE to indicate that framework need not try to + narrow down. Whatever records(depends on application) get skipped are + acceptable. + + + + + mapred.skip.reduce.max.skip.groups + 0 + Integer + skip + + The number of acceptable skip groups surrounding the bad + group PER bad group in reducer + + + The number of acceptable skip groups surrounding the bad + group PER bad group in reducer. The number includes the bad group as well. + To turn the feature of detection/skipping of bad groups off, set the + value to 0. + The framework tries to narrow down the skipped range by retrying + until this threshold is met OR all attempts get exhausted for this task. + Set the value to Long.MAX_VALUE to indicate that framework need not try to + narrow down. Whatever groups(depends on application) get skipped are + acceptable. + + + + + + + job.end.retry.attempts + 0 + Integer + basic + + hadoop retry attempts to contact notification URL + + + Indicates how many times hadoop should attempt to contact the + notification URL + + + + job.end.retry.interval + 30000 + Integer + basic + + notifcation URL retry interval + + + Indicates time in milliseconds between notification URL retry + calls + + + + + hadoop.rpc.socket.factory.class.JobSubmissionProtocol + + true + String + basic + + SocketFactory to use to connect to a Map/Reduce master (JobTracker) + + + SocketFactory to use to connect to a Map/Reduce master + (JobTracker). If null or empty, then use hadoop.rpc.socket.class.default. + + + + + mapred.task.cache.levels + 2 + Integer + perf + + max level of the task cache + + + This is the max level of the task cache. For example, if + the level is 2, the tasks cached are at the host level and at the rack + level. + + + + + mapred.queue.names + false + default + String + jobtracker + + list of queues configured for this jobtracker + + + Comma separated list of queues configured for this jobtracker. + Jobs are added to queues and schedulers can configure different + scheduling properties for the various queues. To configure a property + for a queue, the name of the queue must match the name specified in this + value. Queue properties that are common to all schedulers are configured + here with the naming convention, mapred.queue.$QUEUE-NAME.$PROPERTY-NAME, + for e.g. mapred.queue.default.submit-job-acl. + The number of queues configured in this parameter could depend on the + type of scheduler being used, as specified in + mapred.jobtracker.taskScheduler. For example, the JobQueueTaskScheduler + supports only a single queue, which is the default configured here. + Before adding more queues, ensure that the scheduler you've configured + supports multiple queues. + + + + + mapred.acls.enabled + true + false + Boolean + basic + + Whether to enable ACL check + + + Specifies whether ACLs should be checked + for authorization of users for doing various queue and job level operations. + ACLs are disabled by default. If enabled, access control checks are made by + JobTracker and TaskTracker when requests are made by users for queue + operations like submit job to a queue and kill a job in the queue and job + operations like viewing the job-details (See mapreduce.job.acl-view-job) + or for modifying the job (See mapreduce.job.acl-modify-job) using + Map/Reduce APIs, RPCs or via the console and web user interfaces. + + + + + mapred.queue.default.state + RUNNING + String + basic + + job state value + + + + This values defines the state , default queue is in. 
+ the values can be either "STOPPED" or "RUNNING" + This value can be changed at runtime. + + + + + mapred.job.queue.name + default + String + job + + Queue to which a job is submitted + + + Queue to which a job is submitted. This must match one of the + queues defined in mapred.queue.names for the system. Also, the ACL setup + for the queue must allow the current user to submit a job to the queue. + Before specifying a queue, ensure that the system is configured with + the queue, and access is allowed for submitting jobs to the queue. + + + + + mapreduce.job.acl-modify-job + + + String + true + job + + Job specific access-control list for 'modifying' the job + + + Job specific access-control list for 'modifying' the job. It + is only used if authorization is enabled in Map/Reduce by setting the + configuration property mapred.acls.enabled to true. + This specifies the list of users and/or groups who can do modification + operations on the job. For specifying a list of users and groups the + format to use is "user1,user2 group1,group". If set to '*', it allows all + users/groups to modify this job. If set to ' '(i.e. space), it allows + none. This configuration is used to guard all the modifications with respect + to this job and takes care of all the following operations: + o killing this job + o killing a task of this job, failing a task of this job + o setting the priority of this job + Each of these operations are also protected by the per-queue level ACL + "acl-administer-jobs" configured via mapred-queues.xml. So a caller should + have the authorization to satisfy either the queue-level ACL or the + job-level ACL. + Irrespective of this ACL configuration, job-owner, the user who started the + cluster, cluster administrators configured via + mapreduce.cluster.administrators and queue administrators of the queue to + which this job is submitted to configured via + mapred.queue.queue-name.acl-administer-jobs in mapred-queue-acls.xml can + do all the modification operations on a job. + By default, nobody else besides job-owner, the user who started the cluster, + cluster administrators and queue administrators can perform modification + operations on a job. + + + + + mapreduce.job.acl-view-job + + + String + true + job + + Job specific access-control list for 'viewing' the job + + + Job specific access-control list for 'viewing' the job. It is + only used if authorization is enabled in Map/Reduce by setting the + configuration property mapred.acls.enabled to true. + This specifies the list of users and/or groups who can view private details + about the job. For specifying a list of users and groups the + format to use is "user1,user2 group1,group". If set to '*', it allows all + users/groups to view this job. If set to ' '(i.e. space), it allows + none. This configuration is used to guard some of the job-views and at + present only protects APIs that can return possibly sensitive information + of the job-owner like + o job-level counters + o task-level counters + o tasks' diagnostic information + o task-logs displayed on the TaskTracker web-UI and + o job.xml showed by the JobTracker's web-UI + Every other piece of information of jobs is still accessible by any other + user, for e.g., JobStatus, JobProfile, list of jobs in the queue, etc. 
+ Irrespective of this ACL configuration, job-owner, the user who started the + cluster, cluster administrators configured via + mapreduce.cluster.administrators and queue administrators of the queue to + which this job is submitted to configured via + mapred.queue.queue-name.acl-administer-jobs in mapred-queue-acls.xml can do + all the view operations on a job. + By default, nobody else besides job-owner, the user who started the + cluster, cluster administrators and queue administrators can perform + view operations on a job. + + + + + mapred.tasktracker.indexcache.mb + 10 + Integer + tasktracker + + The maximum memory that a task tracker allows for the index cache + + + The maximum memory that a task tracker allows for the + index cache that is used when serving map outputs to reducers. + + + + + mapred.combine.recordsBeforeProgress + 10000 + Integer + basic + + The number of records to process during combine output collection + before sending a progress notification to the TaskTracker. + + + The number of records to process during combine output collection + before sending a progress notification to the TaskTracker. + + + + + mapred.merge.recordsBeforeProgress + 10000 + Integer + basic + + The number of records to process during merge before + sending a progress notification to the TaskTracker. + + + The number of records to process during merge before + sending a progress notification to the TaskTracker. + + + + + mapred.reduce.slowstart.completed.maps + 0.05 + Float + job + + Fraction of the number of maps in the job which should be + complete before reduces are scheduled for the job + + + Fraction of the number of maps in the job which should be + complete before reduces are scheduled for the job. + + + + + mapred.task.tracker.task-controller + org.apache.hadoop.mapred.DefaultTaskController + Class + basic + + TaskController which is used to launch and manage task execution + + + TaskController which is used to launch and manage task execution + + + + mapreduce.tasktracker.group + + true + String + tasktracker + + Group to which TaskTracker belongs + + + Expert: Group to which TaskTracker belongs. If + LinuxTaskController is configured via mapreduce.tasktracker.taskcontroller, + the group owner of the task-controller binary should be same as this group. + + + + + mapred.disk.healthChecker.interval + 60000 + Integer + health + + node health check interval + + + How often the TaskTracker checks the health of its + local directories. Configuring this to a value smaller than the + heartbeat interval is equivalent to setting this to heartbeat + interval value. + + + + + + mapred.healthChecker.script.path + + true + Integer + health + + node health script path + + + Absolute path to the script which is + periodically run by the node health monitoring service to determine if + the node is healthy or not. If the value of this key is empty or the + file does not exist in the location configured here, the node health + monitoring service is not started. + + + + mapred.healthChecker.interval + 60000 + Integer + health + + Frequency of the node health script to be run + + + Frequency of the node health script to be run + + + + mapred.healthChecker.script.timeout + 600000 + Integer + health + + node health script timeout + + + Time after node health script should be killed if + unresponsive and considered that the script has failed. 
+ + + + mapred.healthChecker.script.args + + true + String + health + + List of arguments which are to be passed to + node health script when it is being launched comma seperated. + + + List of arguments which are to be passed to + node health script when it is being launched comma seperated. + + + + + mapreduce.job.counters.limit + 120 + Integer + job + + Limit on the number of counters allowed per job. + + + Limit on the number of counters allowed per job. + + + + mapreduce.slot.memory.weight + + 50 + Integer + tasktracker + + TaskTracker reserve heapsize weight + + true + directory + + The weight of tasktracker reserve heapsize and the default value is 50. + +
TextItem
+
+ + + mapred.scheduler + fair + String + basic + + Task Schedule + + true + advanced + + Map/Reduce Task schedule method. If the Capacity scheduler has been selected, then additional items need to be configured. + +
RadioGroupItem
+ fair,capacity +
+ + mapred.map.reduce.ratio + 2 + Integer + basic + + The map/reduce ratio. + + true + + The map/reduce ratio. + + + + mapred.cpu.ratio.max + 1.5 + Float + basic + + The cpu max usage ratio. + + true + + The cpu max usage ratio. + + + + + mapred.fairscheduler.preemption + false + true + Boolean + perf + + Whether to enable fairscheduler preemption. + + + Whether to enable fairscheduler preemption. + + + + mapred.fairscheduler.assignmultiple + false + true + Boolean + perf + + Whether to assign multiple + + + Whether to assign multiple + + + + mapred.fairscheduler.sizebasedweight + false + true + Boolean + perf + + size based weight + + + size based weight + + + + mapred.fairscheduler.poolnameproperty + false + mapred.queue.name + String + perf + + pool name property + + + job.set("mapred.queue.name",pool); // pool is set to either 'high' or 'low' + + + + mapred.capacity-scheduler.maximum-system-jobs + 3000 + Integer + basic + + Maximum number of jobs in the system which can be initialized, + concurrently, by the CapacityScheduler + + + Maximum number of jobs in the system which can be initialized, + concurrently, by the CapacityScheduler. + + + + mapred.capacity-scheduler.queue.default.capacity + 100 + Integer + basic + + Percentage of the number of slots in the cluster that are + to be available for jobs in this queue. + + + Percentage of the number of slots in the cluster that are + to be available for jobs in this queue. + + + + + mapred.capacity-scheduler.queue.default.maximum-capacity + -1 + Integer + scheduling + + per-queue maximum-capacity + + + + maximum-capacity defines a limit beyond which a queue cannot use the capacity of the cluster. + This provides a means to limit how much excess capacity a queue can use. By default, there is no limit. + The maximum-capacity of a queue can only be greater than or equal to its minimum capacity. + Default value of -1 implies a queue can use complete capacity of the cluster. + This property could be to curtail certain jobs which are long running in nature from occupying more than a + certain percentage of the cluster, which in the absence of pre-emption, could lead to capacity guarantees of + other queues being affected. + One important thing to note is that maximum-capacity is a percentage , so based on the cluster's capacity + the max capacity would change. So if large number of nodes or racks get added to the cluster , max Capacity in + absolute terms would increase accordingly. + + + + + mapred.capacity-scheduler.queue.default.supports-priority + false + Boolean + scheduling + + Whether to take jobs' priorities into account in scheduling decisions + + + If true, priorities of jobs will be taken into + account in scheduling decisions. + + + + + mapred.capacity-scheduler.queue.default.minimum-user-limit-percent + 100 + Integer + scheduling + + maximum limit on per-user's allocated percentage of resources + + + + Each queue enforces a limit on the percentage of resources + allocated to a user at any given time, if there is competition for them. + This user limit can vary between a minimum and maximum value. The former + depends on the number of users who have submitted jobs, and the latter is + set to this property value. For example, suppose the value of this + property is 25. If two users have submitted jobs to a queue, no single + user can use more than 50% of the queue resources. If a third user submits + a job, no single user can use more than 33% of the queue resources. 
With 4 + or more users, no user can use more than 25% of the queue's resources. A + value of 100 implies no user limits are imposed. + + + + + mapred.capacity-scheduler.queue.default.user-limit-factor + 1 + Integer + scheduling + + The multiple of the queue capacity which can be configured to + allow a single user to acquire more slots. + + + + The multiple of the queue capacity which can be configured to + allow a single user to acquire more slots. + + + + + mapred.capacity-scheduler.queue.default.maximum-initialized-active-tasks + 200000 + Integer + scheduling + + The maximum number of tasks, across all jobs in the queue, + which can be initialized concurrently. + + + The maximum number of tasks, across all jobs in the queue, + which can be initialized concurrently. Once the queue's jobs exceed this + limit they will be queued on disk. + + + + + mapred.capacity-scheduler.queue.default.maximum-initialized-active-tasks-per-user + 100000 + Integer + scheduling + + The maximum number of tasks per-user, across all the of the + user's jobs in the queue, which can be initialized concurrently + + + The maximum number of tasks per-user, across all the of the + user's jobs in the queue, which can be initialized concurrently. Once the + user's jobs exceed this limit they will be queued on disk. + + + + + mapred.capacity-scheduler.queue.default.init-accept-jobs-factor + 10 + Integer + scheduling + + The multipe of (maximum-system-jobs * queue-capacity) used to + determine the number of jobs which are accepted by the scheduler. + + + The multipe of (maximum-system-jobs * queue-capacity) used to + determine the number of jobs which are accepted by the scheduler. + + + + + + + mapred.capacity-scheduler.default-supports-priority + false + Boolean + scheduling + + If true, priorities of jobs will be taken into + account in scheduling decisions by default in a job queue. + + + If true, priorities of jobs will be taken into + account in scheduling decisions by default in a job queue. + + + + mapred.capacity-scheduler.default-minimum-user-limit-percent + 100 + Integer + scheduling + + The percentage of the resources limited to a particular user + for the job queue at any given point of time by default. + + + The percentage of the resources limited to a particular user + for the job queue at any given point of time by default. + + + + mapred.capacity-scheduler.default-user-limit-factor + 1 + Integer + scheduling + + The default multiple of queue-capacity which is used to + determine the amount of slots a single user can consume concurrently. + + + + The default multiple of queue-capacity which is used to + determine the amount of slots a single user can consume concurrently. + + + + + mapred.capacity-scheduler.default-maximum-active-tasks-per-queue + 200000 + Integer + scheduling + + The default maximum number of tasks, across all jobs in the + queue, which can be initialized concurrently + + + The default maximum number of tasks, across all jobs in the + queue, which can be initialized concurrently. Once the queue's jobs exceed + this limit they will be queued on disk. + + + + + mapred.capacity-scheduler.default-maximum-active-tasks-per-user + 100000 + Integer + scheduling + + The default maximum number of tasks per-user, across all the of + the user's jobs in the queue, which can be initialized concurrently + + + The default maximum number of tasks per-user, across all the of + the user's jobs in the queue, which can be initialized concurrently. 
Once + the user's jobs exceed this limit they will be queued on disk. + + + + + mapred.capacity-scheduler.default-init-accept-jobs-factor + 10 + Integer + scheduling + + The default multipe of (maximum-system-jobs * queue-capacity) + used to determine the number of jobs which are accepted by the scheduler. + + + + The default multipe of (maximum-system-jobs * queue-capacity) + used to determine the number of jobs which are accepted by the scheduler. + + + + + + mapred.capacity-scheduler.init-poll-interval + 5000 + Integer + scheduling + + The amount of time in miliseconds which is used to poll + the job queues for jobs to initialize. + + + The amount of time in miliseconds which is used to poll + the job queues for jobs to initialize. + + + + mapred.capacity-scheduler.init-worker-threads + 5 + Integer + scheduling + + Number of worker threads which would be used by + Initialization poller to initialize jobs in a set of queue + + + Number of worker threads which would be used by + Initialization poller to initialize jobs in a set of queue. + If number mentioned in property is equal to number of job queues + then a single thread would initialize jobs in a queue. If lesser + then a thread would get a set of queues assigned. If the number + is greater then number of threads would be equal to number of + job queues. + + + + + resmon.joblevel.metrics.enabled + false + Boolean + basic + + Whether to enable joblevel metrics + + true + + Whether to enable joblevel metrics + + + + mapred.profiling + false + Boolean + profiling + + Whether to enable profiling or not + + + The flag to determine whether Profiling Feature enable or not. + + + + + directory + Configuration + true + false + + + advanced + Advanced Configuration + true + false + + + basic + Basic Configuration + Basic configurations that get HDFS running. + + + perf + Performance + Configurations that affect Hadoop's performance + + + jobtracker + Jobtracker Configuration + Configurations for Jobtracker. + + + tasktracker + Tasktracker Configuration + Configurations for Tasktracker. + + + map + Map Configuration + Configurations for Map job. + + + reduce + Reduce Configuration + Configurations for Reduce job. + + + io + IO Configuration + Configurations for Input/Output. + + + job + Job Configuration + Configurations for a job. + + + user + Configurations for user + Configurations for user. + + + scheduling + Configurations for scheduling + Configurations for scheduling. + + + profiling + Configurations for profiling + Configurations for profiling. + + + skip + Configurations for skip mode + Configurations for skip mode. + + + health + Configurations for health check + Configurations for health check. + +
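Note on the resource files above: hadoop-default.xml, hdfs-default.xml and mapred-default.xml extend the stock Hadoop defaults with a value type, a configuration group (basic, perf, jobtracker, ...) and a localized description for each property. The short sketch below shows how such a file comes back from the load_hadoop_xml_defaults_with_type_and_locale() helper that this patch adds to savanna/utils/xmlutils.py further down; the resource path and the Boolean filter are illustrative only (the plugin's config_helper is presumably the real consumer and may load the file differently).

    from savanna.utils import xmlutils as x

    # Path is an assumption for illustration; the loader resolves it
    # relative to the savanna package, as the unit test below does.
    configs = x.load_hadoop_xml_defaults_with_type_and_locale(
        'plugins/intel/resources/mapred-default.xml')

    # Each property entry is flattened into a plain dict, e.g.
    # {'name': 'mapred.map.tasks.speculative.execution',
    #  'value': 'true', 'type': 'Boolean', 'description': '...'}
    boolean_configs = [c for c in configs if c['type'] == 'Boolean']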
diff --git a/savanna/tests/unit/plugins/intel/__init__.py b/savanna/tests/unit/plugins/intel/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/savanna/tests/unit/plugins/intel/client/__init__.py b/savanna/tests/unit/plugins/intel/client/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/savanna/tests/unit/plugins/intel/client/response.py b/savanna/tests/unit/plugins/intel/client/response.py new file mode 100644 index 00000000..b2b867fa --- /dev/null +++ b/savanna/tests/unit/plugins/intel/client/response.py @@ -0,0 +1,28 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import json + + +class Response: + def __init__(self, data=None, ok=True, status_code=200): + self.text = json.dumps(data) + self.ok = ok + self.status_code = status_code + self.reason = None + + +def make_resp(data=None, ok=True, status_code=200): + return Response(data, ok, status_code) diff --git a/savanna/tests/unit/plugins/intel/client/test_client.py b/savanna/tests/unit/plugins/intel/client/test_client.py new file mode 100644 index 00000000..7565bdb7 --- /dev/null +++ b/savanna/tests/unit/plugins/intel/client/test_client.py @@ -0,0 +1,310 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +import mock + +from savanna import exceptions as ex +from savanna.plugins.intel.client import client as c +from savanna.plugins.intel import exceptions as iex +from savanna.tests.unit import base +from savanna.tests.unit.plugins.intel.client import response as r + + +SESSION_POST_DATA = {'sessionID': '123'} +SESSION_GET_DATA = {"items": [ + { + "nodeprogress": { + "hostname": 'host', + 'info': '_ALLFINISH\n' + } + } +]} + + +class TestClient(base.DbTestCase): + + @mock.patch('requests.post') + @mock.patch('requests.get') + def test_cluster_op(self, get, post): + client = c.IntelClient('qwe', 'rty') + + data = {'lelik': 'bolik'} + + post.return_value = r.make_resp(data) + self.assertEqual(client.cluster.create(), data) + + get.return_value = r.make_resp(data) + self.assertEqual(client.cluster.get(), data) + + post.return_value = r.make_resp(SESSION_POST_DATA) + get.return_value = r.make_resp(SESSION_GET_DATA) + client.cluster.install_software(['bla-bla']) + + self.assertEqual(post.call_count, 2) + self.assertEqual(get.call_count, 2) + + @mock.patch('requests.delete') + @mock.patch('requests.post') + @mock.patch('requests.get') + def test_nodes_op(self, get, post, delete): + client = c.IntelClient('qwe', 'rty') + + # add + post.return_value = r.make_resp(data={ + "items": [ + { + "iporhostname": "n1", + "info": "Connected" + }, + { + "iporhostname": "n2", + "info": "Connected" + } + ] + }) + client.nodes.add(['n1', 'n2'], 'hadoop', '/Def', '/tmp/key') + post.return_value = r.make_resp(data={ + "items": [ + { + "iporhostname": "n1", + "info": "bla-bla" + } + ] + }) + self.assertRaises(iex.IntelPluginException, client.nodes.add, + ['n1'], 'hadoop', '/Def', '/tmp/key') + + # config + post.return_value = r.make_resp(SESSION_POST_DATA) + get.return_value = r.make_resp(SESSION_GET_DATA) + client.nodes.config() + + # delete + delete.return_value = r.make_resp() + client.nodes.delete(['n1']) + + # get + get.return_value = r.make_resp() + client.nodes.get() + + # get_status + get.return_value = r.make_resp(data={"status": "running"}) + client.nodes.get_status(['n1']) + + # stop_nodes + post.return_value = r.make_resp() + client.nodes.stop(['n1']) + + self.assertEqual(delete.call_count, 1) + self.assertEqual(post.call_count, 4) + self.assertEqual(get.call_count, 3) + + @mock.patch('requests.put') + @mock.patch('requests.post') + def test_params_op(self, post, put): + client = c.IntelClient('qwe', 'rty') + post.return_value = r.make_resp() + put.return_value = r.make_resp() + + # add + client.params.hdfs.add('lelik', 'bolik') + client.params.hadoop.add('lelik', 'bolik') + client.params.mapred.add('lelik', 'bolik') + + # get + self.assertRaises(ex.NotImplementedException, client.params.hdfs.get, + ['n1'], 'lelik') + self.assertRaises(ex.NotImplementedException, client.params.hadoop.get, + ['n1'], 'lelik') + self.assertRaises(ex.NotImplementedException, client.params.mapred.get, + ['n1'], 'lelik') + + # update + client.params.hdfs.update('lelik', 'bolik', nodes=['n1']) + client.params.hdfs.update('lelik', 'bolik') + client.params.hadoop.update('lelik', 'bolik', nodes=['n1']) + client.params.hadoop.update('lelik', 'bolik') + client.params.mapred.update('lelik', 'bolik', nodes=['n1']) + client.params.mapred.update('lelik', 'bolik') + + self.assertEqual(post.call_count, 3) + self.assertEqual(put.call_count, 6) + + @mock.patch('savanna.context.sleep', lambda x: None) + @mock.patch('requests.post') + @mock.patch('requests.get') + def test_base_services_op(self, get, post): + client = c.IntelClient('qwe', 
'rty') + + # start + post.return_value = r.make_resp() + get.return_value = r.make_resp(data={ + "items": [ + { + "serviceName": "hdfs", + "status": "running" + }, + { + "serviceName": "mapred", + "status": "running" + } + ]}) + client.services.hdfs.start() + client.services.mapred.start() + + get.return_value = r.make_resp(data={ + "items": [ + { + "serviceName": "hdfs", + "status": "stopped" + }, + { + "serviceName": "mapred", + "status": "stopped" + } + ] + }) + + self.assertRaises(iex.IntelPluginException, + client.services.hdfs.start) + self.assertRaises(iex.IntelPluginException, + client.services.mapred.start) + + # stop + post.return_value = r.make_resp() + client.services.hdfs.stop() + client.services.mapred.stop() + + # service + get.return_value = r.make_resp(data={ + "items": [ + { + "serviceName": "bla-bla", + "status": "fail" + } + ] + }) + + self.assertRaises(iex.IntelPluginException, + client.services.hdfs.status) + self.assertRaises(iex.IntelPluginException, + client.services.mapred.status) + + # get_nodes + get.return_value = r.make_resp() + client.services.hdfs.get_nodes() + client.services.mapred.get_nodes() + + # add_nodes + post.return_value = r.make_resp() + client.services.hdfs.add_nodes('DataNode', ['n1', 'n2']) + client.services.mapred.add_nodes('NameNode', ['n1', 'n2']) + + self.assertEqual(get.call_count, 126) + self.assertEqual(post.call_count, 8) + + @mock.patch('requests.delete') + @mock.patch('requests.post') + @mock.patch('requests.get') + def test_services_op(self, get, post, delete): + client = c.IntelClient('qwe', 'rty') + + # add + post.return_value = r.make_resp() + client.services.add(['hdfs', 'mapred']) + + # get_services + get.return_value = r.make_resp() + client.services.get_services() + + # delete_service + delete.return_value = r.make_resp() + client.services.delete_service('hdfs') + + @mock.patch('requests.post') + @mock.patch('requests.get') + def test_hdfs_services_op(self, get, post): + client = c.IntelClient('qwe', 'rty') + + # format + get.return_value = r.make_resp(SESSION_GET_DATA) + post.return_value = r.make_resp(SESSION_POST_DATA) + client.services.hdfs.format() + + # decommission + post.return_value = r.make_resp() + client.services.hdfs.decommission_nodes(['n1']) + + # get status + get.return_value = r.make_resp(data={ + "items": [ + { + "hostname": "n1", + "status": "start" + } + ] + }) + client.services.hdfs.get_datanodes_status() + self.assertEqual(client.services.hdfs.get_datanode_status('n1'), + 'start') + self.assertRaises(iex.IntelPluginException, + client.services.hdfs.get_datanode_status, 'n2') + + self.assertEqual(get.call_count, 4) + self.assertEqual(post.call_count, 2) + + @mock.patch('savanna.context.sleep', lambda x: None) + @mock.patch('requests.post') + @mock.patch('requests.get') + def test_session_op(self, get, post): + client = c.IntelClient('qwe', 'rty') + + data1 = { + "items": [ + { + "nodeprogress": { + "hostname": 'host', + 'info': 'info\n' + } + } + ] + } + data2 = { + "items": [ + { + "nodeprogress": { + "hostname": 'host', + 'info': '_ALLFINISH\n' + } + } + ] + } + + get.side_effect = (r.make_resp(data1), r.make_resp(data2)) + post.return_value = r.make_resp(SESSION_POST_DATA) + + client.services.hdfs.format() + + self.assertEqual(get.call_count, 2) + self.assertEqual(post.call_count, 1) + + @mock.patch('requests.get') + def test_rest_client(self, get): + client = c.IntelClient('qwe', 'rty') + get.return_value = r.make_resp(ok=False, status_code=500, data={ + "message": "message" + }) + 
self.assertRaises(iex.IntelPluginException, + client.services.get_services) diff --git a/savanna/tests/unit/plugins/intel/test_plugin.py b/savanna/tests/unit/plugins/intel/test_plugin.py new file mode 100644 index 00000000..0fe46a19 --- /dev/null +++ b/savanna/tests/unit/plugins/intel/test_plugin.py @@ -0,0 +1,61 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from savanna.plugins.general import exceptions as g_ex +from savanna.plugins.intel import config_helper as c_helper +from savanna.plugins.intel import exceptions as i_ex +from savanna.plugins.intel import plugin as p +from savanna.tests.unit import base +from savanna.tests.unit.plugins.intel import test_utils as tu + + +class TestIDHPlugin(base.DbTestCase): + def test_get_configs(self): + plugin = p.IDHProvider() + configs = plugin.get_configs('2.5.0') + + self.assertIn(c_helper.IDH_REPO_URL, configs) + self.assertIn(c_helper.IDH_TARBALL_URL, configs) + self.assertIn(c_helper.OS_REPO_URL, configs) + + def test_validate(self): + plugin = p.IDHProvider() + + ng_mng = tu.make_ng_dict('mng', 'f1', ['manager'], 1) + ng_nn = tu.make_ng_dict('nn', 'f1', ['namenode'], 1) + ng_jt = tu.make_ng_dict('jt', 'f1', ['jobtracker'], 1) + ng_dn = tu.make_ng_dict('dn', 'f1', ['datanode'], 2) + ng_tt = tu.make_ng_dict('tt', 'f1', ['tasktracker'], 2) + + cl = tu.create_cluster('cl1', 't1', 'intel', '2.5.0', + [ng_nn] + [ng_dn]) + self.assertRaises(i_ex.NotSingleManagerException, plugin.validate, cl) + + cl = tu.create_cluster('cl1', 't1', 'intel', '2.5.0', [ng_mng]) + self.assertRaises(g_ex.NotSingleNameNodeException, plugin.validate, cl) + + cl = tu.create_cluster('cl1', 't1', 'intel', '2.5.0', + [ng_mng] + [ng_nn] * 2) + self.assertRaises(g_ex.NotSingleNameNodeException, plugin.validate, cl) + + cl = tu.create_cluster('cl1', 't1', 'intel', '2.5.0', + [ng_mng] + [ng_nn] + [ng_tt]) + self.assertRaises(g_ex.TaskTrackersWithoutJobTracker, + plugin.validate, cl) + + cl = tu.create_cluster('cl1', 't1', 'intel', '2.5.0', + [ng_mng] + [ng_nn] + [ng_jt] * 2 + [ng_tt]) + self.assertRaises(g_ex.NotSingleJobTrackerException, + plugin.validate, cl) diff --git a/savanna/tests/unit/plugins/intel/test_utils.py b/savanna/tests/unit/plugins/intel/test_utils.py new file mode 100644 index 00000000..04cb0c6d --- /dev/null +++ b/savanna/tests/unit/plugins/intel/test_utils.py @@ -0,0 +1,32 @@ +# Copyright (c) 2013 Intel Corporation +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or +# implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +from savanna.conductor import resource as r + + +def create_cluster(name, tenant, plugin, version, node_groups, **kwargs): + dct = {'name': name, 'tenant_id': tenant, 'plugin_name': plugin, + 'hadoop_version': version, 'node_groups': node_groups} + dct.update(kwargs) + return r.ClusterResource(dct) + + +def make_ng_dict(name, flavor, processes, count, instances=[]): + return {'name': name, 'flavor_id': flavor, 'node_processes': processes, + 'count': count, 'instances': instances} + + +def make_inst_dict(inst_id, inst_name): + return {'instance_id': inst_id, 'instance_name': inst_name} diff --git a/savanna/tests/unit/resources/test-default-with-type-and-locale.xml b/savanna/tests/unit/resources/test-default-with-type-and-locale.xml new file mode 100644 index 00000000..c4b86fb8 --- /dev/null +++ b/savanna/tests/unit/resources/test-default-with-type-and-locale.xml @@ -0,0 +1,43 @@ + + + + + name1 + value1 + String + + descr1 + + + + + name2 + value2 + + descr2 + + + + + name3 + + String + + descr3 + + + + + name4 + String + + descr4 + + + + + name5 + value5 + String + + diff --git a/savanna/tests/unit/utils/test_xml_utils.py b/savanna/tests/unit/utils/test_xml_utils.py index 2b3b8202..5611cdba 100644 --- a/savanna/tests/unit/utils/test_xml_utils.py +++ b/savanna/tests/unit/utils/test_xml_utils.py @@ -36,6 +36,24 @@ class XMLUtilsTestCase(unittest2.TestCase): x.load_hadoop_xml_defaults( 'tests/unit/resources/test-default.xml')) + def test_load_xml_defaults_with_type_and_locale(self): + expected = [ + {'name': u'name1', 'value': u'value1', 'type': u'String', + 'description': 'descr1'}, + {'name': u'name2', 'value': u'value2', 'type': u'', + 'description': 'descr2'}, + {'name': u'name3', 'value': '', 'type': u'String', + 'description': 'descr3'}, + {'name': u'name4', 'value': '', 'type': u'String', + 'description': 'descr4'}, + {'name': u'name5', 'value': u'value5', 'type': u'String', + 'description': ''}] + actual = x.load_hadoop_xml_defaults_with_type_and_locale( + 'tests/unit/resources/test-default-with-type-and-locale.xml') + self.assertListEqual( + expected, + actual) + def test_adjust_description(self): self.assertEqual(x._adjust_field("\n"), "") self.assertEqual(x._adjust_field("\n "), "") diff --git a/savanna/utils/xmlutils.py b/savanna/utils/xmlutils.py index 95306422..7e2464cf 100644 --- a/savanna/utils/xmlutils.py +++ b/savanna/utils/xmlutils.py @@ -36,6 +36,27 @@ def load_hadoop_xml_defaults(file_name): return configs +def load_hadoop_xml_defaults_with_type_and_locale(file_name): + doc = load_xml_document(file_name) + configs = [] + prop = doc.getElementsByTagName('property') + for elements in prop: + configs.append({ + 'name': _get_text_from_node(elements, 'name'), + 'value': _get_text_from_node(elements, 'value'), + 'type': _get_text_from_node(elements, 'valuetype'), + 'description': _adjust_field( + _get_text_from_node( + _get_node_element(elements, 'description'), 'en')) + }) + return configs + + +def _get_node_element(element, name): + element = element.getElementsByTagName(name) + return element[0] if element and element[0].hasChildNodes() else None + + def create_hadoop_xml(configs, config_filter=None): doc = xml.Document() @@ -68,7 +89,7 @@ def load_xml_document(file_name): def _get_text_from_node(element, name): - element = element.getElementsByTagName(name) + element = element.getElementsByTagName(name) if element else None return element[0].firstChild.nodeValue if ( element and element[0].hasChildNodes()) else '' diff --git a/setup.cfg b/setup.cfg index 
64b96a35..e5cffc29 100644 --- a/setup.cfg +++ b/setup.cfg @@ -36,6 +36,7 @@ console_scripts = savanna.cluster.plugins = vanilla = savanna.plugins.vanilla.plugin:VanillaProvider hdp = savanna.plugins.hdp.ambariplugin:AmbariPlugin + idh = savanna.plugins.intel.plugin:IDHProvider savanna.infrastructure.engine = savanna = savanna.service.instances:SavannaInfrastructureEngine
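The setup.cfg hunk above is what makes the new provider discoverable: it registers 'idh' in the savanna.cluster.plugins entry point group, pointing at savanna.plugins.intel.plugin:IDHProvider. A rough sketch of what that wiring gives you, using plain pkg_resources rather than Savanna's own plugin manager (which may load plugins differently); the '2.5.0' version string is the one exercised in test_plugin.py above:

    import pkg_resources

    # Resolve the entry point added in setup.cfg and instantiate the provider.
    for ep in pkg_resources.iter_entry_points('savanna.cluster.plugins'):
        if ep.name == 'idh':
            provider_cls = ep.load()  # -> savanna.plugins.intel.plugin:IDHProvider
            plugin = provider_cls()
            configs = plugin.get_configs('2.5.0')  # as in test_plugin.py
            break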