hadoop-client properties
Panagiotis Liakos
p.liakos at di.uoa.gr
Mon Apr 11 13:30:10 UTC 2016
Hi all,
I am trying to set up a cluster with juju in the local environment to
submit jobs with Apache Giraph. You can find the details of my setup
at the end of this e-mail.
I have downloaded and built Apache Giraph on my hadoop-client and I
want to try some examples that execute on two workers.
After a number of failed attempts I found out that I have to set the
property 'mapreduce.jobtracker.address' (or the deprecated
'mapred.job.tracker') to 'yarn' in order to run giraph with > 1
workers.
In particular, Giraph considered that this property was set to 'local'.
At first I found out that I can set a custom attribute with:
-ca giraph.SplitMasterWorker=false
to execute my job with one worker.
Then, after finding the code responsible for this
behavior (https://github.com/apache/giraph/blob/7e48523b520afee8e727d1e1aaab801a3bd80f06/giraph-core/src/main/java/org/apache/giraph/job/GiraphJob.java#L143)
I was able to set the correct hadoop property and execute my job with
2 workers.
My question is, why is this property not set in the juju client charm?
Does it enable some otherwise undesired behavior?
I see that 'mapreduce.framework.name' is set to 'yarn' but apparently
this is not enough for giraph.
Thank you.
--Panagiotis Liakos
My environment:
environment: local
machines:
"0":
agent-state: started
agent-version: 1.25.3.1
dns-name: localhost
instance-id: localhost
series: trusty
state-server-member-status: has-vote
"1":
agent-state: started
agent-version: 1.25.3.1
dns-name: 10.0.3.78
instance-id: panagiotis-local-machine-1
series: trusty
hardware: arch=amd64
"2":
agent-state: started
agent-version: 1.25.3.1
dns-name: 10.0.3.178
instance-id: panagiotis-local-machine-2
series: trusty
hardware: arch=amd64
"3":
agent-state: started
agent-version: 1.25.3.1
dns-name: 10.0.3.182
instance-id: panagiotis-local-machine-3
series: trusty
hardware: arch=amd64
"4":
agent-state: started
agent-version: 1.25.3.1
dns-name: 10.0.3.179
instance-id: panagiotis-local-machine-4
series: trusty
hardware: arch=amd64
"5":
agent-state: started
agent-version: 1.25.3.1
dns-name: 10.0.3.183
instance-id: panagiotis-local-machine-5
series: trusty
hardware: arch=amd64
services:
client:
charm: cs:trusty/hadoop-client-1
exposed: false
service-status:
current: active
message: Ready
since: 10 Apr 2016 08:08:20+03:00
relations:
hadoop:
- plugin
units:
client/0:
workload-status:
current: active
message: Ready
since: 10 Apr 2016 08:08:20+03:00
agent-status:
current: idle
since: 10 Apr 2016 08:08:23+03:00
version: 1.25.3.1
agent-state: started
agent-version: 1.25.3.1
machine: "5"
public-address: 10.0.3.183
subordinates:
plugin/0:
workload-status:
current: active
message: Ready (HDFS & YARN)
since: 10 Apr 2016 08:08:01+03:00
agent-status:
current: idle
since: 10 Apr 2016 08:08:03+03:00
version: 1.25.3.1
agent-state: started
agent-version: 1.25.3.1
upgrading-from: cs:trusty/apache-hadoop-plugin-13
public-address: 10.0.3.183
namenode:
charm: cs:trusty/apache-hadoop-namenode-1
exposed: false
service-status:
current: active
message: Ready (2 DataNodes)
since: 10 Apr 2016 08:04:33+03:00
relations:
datanode:
- slave
namenode:
- plugin
- resourcemgr
units:
namenode/0:
workload-status:
current: active
message: Ready (2 DataNodes)
since: 10 Apr 2016 08:04:33+03:00
agent-status:
current: idle
since: 10 Apr 2016 08:04:36+03:00
version: 1.25.3.1
agent-state: started
agent-version: 1.25.3.1
machine: "1"
open-ports:
- 50070/tcp
public-address: 10.0.3.78
plugin:
charm: cs:trusty/apache-hadoop-plugin-13
exposed: false
service-status: {}
relations:
hadoop-plugin:
- client
namenode:
- namenode
resourcemanager:
- resourcemgr
subordinate-to:
- client
resourcemgr:
charm: cs:trusty/apache-hadoop-resourcemanager-1
exposed: false
service-status:
current: active
message: Ready (2 NodeManagers)
since: 10 Apr 2016 08:07:54+03:00
relations:
namenode:
- namenode
nodemanager:
- slave
resourcemanager:
- plugin
units:
resourcemgr/0:
workload-status:
current: active
message: Ready (2 NodeManagers)
since: 10 Apr 2016 08:07:54+03:00
agent-status:
current: idle
since: 10 Apr 2016 08:07:57+03:00
version: 1.25.3.1
agent-state: started
agent-version: 1.25.3.1
machine: "2"
open-ports:
- 8088/tcp
- 19888/tcp
public-address: 10.0.3.178
slave:
charm: cs:trusty/apache-hadoop-slave-1
exposed: false
service-status:
current: active
message: Ready (DataNode & NodeManager)
since: 10 Apr 2016 08:08:00+03:00
relations:
namenode:
- namenode
resourcemanager:
- resourcemgr
units:
slave/0:
workload-status:
current: active
message: Ready (DataNode & NodeManager)
since: 10 Apr 2016 08:08:00+03:00
agent-status:
current: idle
since: 10 Apr 2016 08:08:03+03:00
version: 1.25.3.1
agent-state: started
agent-version: 1.25.3.1
machine: "3"
open-ports:
- 8042/tcp
- 50075/tcp
public-address: 10.0.3.182
slave/1:
workload-status:
current: active
message: Ready (DataNode & NodeManager)
since: 10 Apr 2016 08:08:30+03:00
agent-status:
current: idle
since: 10 Apr 2016 08:08:33+03:00
version: 1.25.3.1
agent-state: started
agent-version: 1.25.3.1
machine: "4"
open-ports:
- 8042/tcp
- 50075/tcp
public-address: 10.0.3.179
More information about the Juju
mailing list