Hi,

I found the link after hours of going through Google search results...

My hadoop-metrics looks like this:

dfs.class=org.apache.hadoop.metrics.ganglia.GangliaContext
dfs.period=10
dfs.servers=localhost:8649

mapred.class=org.apache.hadoop.metrics.ganglia.GangliaContext
mapred.period=10
mapred.servers=localhost:8649

jvm.class=org.apache.hadoop.metrics.ganglia.GangliaContext
jvm.period=10
jvm.servers=localhost:8649

I use localhost because gmond runs on that machine.
The gmond XML output is attached.


Thanks,
Tamir


On Tue, Mar 17, 2009 at 3:55 PM, Brian Bockelman <bbock...@cse.unl.edu> wrote:

> Hey Tamir,
>
> I assume you want something like this:
>
>
> http://rcf.unl.edu/ganglia/?c=red-workers&h=node155&m=load_one&r=hour&s=descending&hc=4
>
> (That link's old - where'd you find it?  I'll update it...)
>
> Can you send out the relevant lines from the hadoop-metrics file?
>
> Also, can you do the following
>
> telnet (Ganglia host) (Ganglia port)
>
> This should spew out lots of XML data; use the host and port you configured
> hadoop with.
>
> Brian
>
>
> On Mar 17, 2009, at 8:48 AM, Tamir Kamara wrote:
>
>> Hi,
>>
>> For a few days I've been trying to make hadoop work with the Ganglia
>> monitoring software.
>> I'm using hadoop 0.18.3 with ganglia 3.0.6. I've changed the hadoop-metrics
>> file as described in the wiki and also applied the HADOOP-3422 patch. Now, I
>> can only see system metrics in the ganglia data and nothing about hadoop
>> itself.
>>
>> I also tried to add a collection group to gmond.conf for the metric
>> mapred.tasktracker.mapTaskSlots, but that caused gmond to stop working
>> because it couldn't "collect the metric on the platform", which means that
>> it doesn't recognize the metric.
>> It should be possible to do this, as in
>> http://rcf.unl.edu/ganglia/?c=red.
>>
>> There are some posts about this issue, but I couldn't find any answer or
>> detailed description of how to monitor hadoop with ganglia.
>>
>> Does anyone have any experience with this?
>>
>> Thanks,
>> Tamir
>>
>
>
Trying 127.0.0.1...
Connected to localhost.
Escape character is '^]'.
<?xml version="1.0" encoding="ISO-8859-1" standalone="yes"?>
<!DOCTYPE GANGLIA_XML [
   <!ELEMENT GANGLIA_XML (GRID|CLUSTER|HOST)*>
      <!ATTLIST GANGLIA_XML VERSION CDATA #REQUIRED>
      <!ATTLIST GANGLIA_XML SOURCE CDATA #REQUIRED>
   <!ELEMENT GRID (CLUSTER | GRID | HOSTS | METRICS)*>
      <!ATTLIST GRID NAME CDATA #REQUIRED>
      <!ATTLIST GRID AUTHORITY CDATA #REQUIRED>
      <!ATTLIST GRID LOCALTIME CDATA #IMPLIED>
   <!ELEMENT CLUSTER (HOST | HOSTS | METRICS)*>
      <!ATTLIST CLUSTER NAME CDATA #REQUIRED>
      <!ATTLIST CLUSTER OWNER CDATA #IMPLIED>
      <!ATTLIST CLUSTER LATLONG CDATA #IMPLIED>
      <!ATTLIST CLUSTER URL CDATA #IMPLIED>
      <!ATTLIST CLUSTER LOCALTIME CDATA #REQUIRED>
   <!ELEMENT HOST (METRIC)*>
      <!ATTLIST HOST NAME CDATA #REQUIRED>
      <!ATTLIST HOST IP CDATA #REQUIRED>
      <!ATTLIST HOST LOCATION CDATA #IMPLIED>
      <!ATTLIST HOST REPORTED CDATA #REQUIRED>
      <!ATTLIST HOST TN CDATA #IMPLIED>
      <!ATTLIST HOST TMAX CDATA #IMPLIED>
      <!ATTLIST HOST DMAX CDATA #IMPLIED>
      <!ATTLIST HOST GMOND_STARTED CDATA #IMPLIED>
   <!ELEMENT METRIC EMPTY>
      <!ATTLIST METRIC NAME CDATA #REQUIRED>
      <!ATTLIST METRIC VAL CDATA #REQUIRED>
      <!ATTLIST METRIC TYPE (string | int8 | uint8 | int16 | uint16 | int32 | 
uint32 | float | double | timestamp) #REQUIRED>
      <!ATTLIST METRIC UNITS CDATA #IMPLIED>
      <!ATTLIST METRIC TN CDATA #IMPLIED>
      <!ATTLIST METRIC TMAX CDATA #IMPLIED>
      <!ATTLIST METRIC DMAX CDATA #IMPLIED>
      <!ATTLIST METRIC SLOPE (zero | positive | negative | both | unspecified) 
#IMPLIED>
      <!ATTLIST METRIC SOURCE (gmond | gmetric) #REQUIRED>
   <!ELEMENT HOSTS EMPTY>
      <!ATTLIST HOSTS UP CDATA #REQUIRED>
      <!ATTLIST HOSTS DOWN CDATA #REQUIRED>
      <!ATTLIST HOSTS SOURCE (gmond | gmetric | gmetad) #REQUIRED>
   <!ELEMENT METRICS EMPTY>
      <!ATTLIST METRICS NAME CDATA #REQUIRED>
      <!ATTLIST METRICS SUM CDATA #REQUIRED>
      <!ATTLIST METRICS NUM CDATA #REQUIRED>
      <!ATTLIST METRICS TYPE (string | int8 | uint8 | int16 | uint16 | int32 | 
uint32 | float | double | timestamp) #REQUIRED>
      <!ATTLIST METRICS UNITS CDATA #IMPLIED>
      <!ATTLIST METRICS SLOPE (zero | positive | negative | both | unspecified) 
#IMPLIED>
      <!ATTLIST METRICS SOURCE (gmond | gmetric) #REQUIRED>
]>
<GANGLIA_XML VERSION="3.0.6" SOURCE="gmond">
<CLUSTER NAME="Hadoop" LOCALTIME="1237299222" OWNER="unspecified" 
LATLONG="unspecified" URL="unspecified">
<HOST NAME="lb-fds-42.site" IP="192.168.12.6" REPORTED="1237299213" TN="9" 
TMAX="20" DMAX="0" LOCATION="unspecified" GMOND_STARTED="1237297653">
<METRIC NAME="disk_total" VAL="144.736" TYPE="double" UNITS="GB" TN="1565" 
TMAX="1200" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="cpu_speed" VAL="2393" TYPE="uint32" UNITS="MHz" TN="365" 
TMAX="1200" DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="part_max_used" VAL="17.7" TYPE="float" UNITS="%" TN="125" 
TMAX="180" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="swap_total" VAL="2008084" TYPE="uint32" UNITS="KB" TN="365" 
TMAX="1200" DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="os_name" VAL="Linux" TYPE="string" UNITS="" TN="365" TMAX="1200" 
DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="cpu_user" VAL="0.0" TYPE="float" UNITS="%" TN="35" TMAX="90" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="cpu_system" VAL="0.1" TYPE="float" UNITS="%" TN="35" TMAX="90" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="cpu_aidle" VAL="98.8" TYPE="float" UNITS="%" TN="35" TMAX="3800" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="load_five" VAL="1.71" TYPE="float" UNITS=" " TN="35" TMAX="325" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="proc_run" VAL="0" TYPE="uint32" UNITS=" " TN="125" TMAX="950" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="mem_free" VAL="7276988" TYPE="uint32" UNITS="KB" TN="5" 
TMAX="180" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="mem_buffers" VAL="49316" TYPE="uint32" UNITS="KB" TN="5" 
TMAX="180" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="swap_free" VAL="2008084" TYPE="uint32" UNITS="KB" TN="5" 
TMAX="180" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="bytes_in" VAL="186.88" TYPE="float" UNITS="bytes/sec" TN="65" 
TMAX="300" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="pkts_out" VAL="2.58" TYPE="float" UNITS="packets/sec" TN="65" 
TMAX="300" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="cpu_num" VAL="4" TYPE="uint16" UNITS="CPUs" TN="365" TMAX="1200" 
DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="disk_free" VAL="119.523" TYPE="double" UNITS="GB" TN="125" 
TMAX="180" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="mem_total" VAL="8062032" TYPE="uint32" UNITS="KB" TN="365" 
TMAX="1200" DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="cpu_wio" VAL="0.0" TYPE="float" UNITS="%" TN="35" TMAX="90" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="boottime" VAL="1237294446" TYPE="uint32" UNITS="s" TN="365" 
TMAX="1200" DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="machine_type" VAL="x86_64" TYPE="string" UNITS="" TN="365" 
TMAX="1200" DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="os_release" VAL="2.6.16.60-0.21-smp" TYPE="string" UNITS="" 
TN="365" TMAX="1200" DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="cpu_nice" VAL="0.0" TYPE="float" UNITS="%" TN="35" TMAX="90" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="cpu_idle" VAL="99.8" TYPE="float" UNITS="%" TN="35" TMAX="90" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="load_one" VAL="1.62" TYPE="float" UNITS=" " TN="35" TMAX="70" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="load_fifteen" VAL="1.72" TYPE="float" UNITS=" " TN="35" 
TMAX="950" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="proc_total" VAL="196" TYPE="uint32" UNITS=" " TN="125" TMAX="950" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="mem_shared" VAL="0" TYPE="uint32" UNITS="KB" TN="5" TMAX="180" 
DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="mem_cached" VAL="501692" TYPE="uint32" UNITS="KB" TN="5" 
TMAX="180" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="gexec" VAL="OFF" TYPE="string" UNITS="" TN="65" TMAX="300" 
DMAX="0" SLOPE="zero" SOURCE="gmond"/>
<METRIC NAME="bytes_out" VAL="349.38" TYPE="float" UNITS="bytes/sec" TN="65" 
TMAX="300" DMAX="0" SLOPE="both" SOURCE="gmond"/>
<METRIC NAME="pkts_in" VAL="1.45" TYPE="float" UNITS="packets/sec" TN="65" 
TMAX="300" DMAX="0" SLOPE="both" SOURCE="gmond"/>
</HOST>
</CLUSTER>
</GANGLIA_XML>

Reply via email to