[ 
https://issues.apache.org/jira/browse/TEZ-2076?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=14335484#comment-14335484
 ] 

Gopal V commented on TEZ-2076:
------------------------------

{code}
scala> import java.io._;
import java.io._

scala> import org.apache.tez.history.parser._;
import org.apache.tez.history.parser._

scala> val p = new ATSFileParser(new File("dag_1421164610335_0820_1.zip")) 
p: org.apache.tez.history.parser.ATSFileParser = 
org.apache.tez.history.parser.ATSFileParser@25d0cb3a

scala> val d = p.getDAGData("dag_1421164610335_0820_1")
d: org.apache.tez.history.parser.DagInfo = [dagID=dag_1421164610335_0820_1, 
dagName=rajesh_20150210175454_bec56061-02d6-4730-bdf6-89a455625a0f:1, 
status=SUCCEEDED, startTime=0, submitTime=-1423619702215, endTime=1010246, 
timeTaken=1010246, diagnostics=, vertexNameIDMapping={Map 
2=vertex_1421164610335_0820_1_03, Reducer 3=vertex_1421164610335_0820_1_04, Map 
1=vertex_1421164610335_0820_1_02, Map 4=vertex_1421164610335_0820_1_01, Map 
5=vertex_1421164610335_0820_1_00}, failedTasks=0, events=[], status=SUCCEEDED]

scala> println(d.getTimeTaken())
1010246
scala> d.getFailedTasks()
res6: Int = 0

scala> d.getContainersToTaskAttemptMapping()
res7: 
com.google.common.collect.Multimap[org.apache.tez.history.parser.Container,org.apache.tez.history.parser.TaskAttemptInfo]
 = {[id=container_1421164610335_0820_01_000074, 
host=cn053-10.l42scl.hortonworks.com]=[[taskAttemptId=attempt_1421164610335_0820_1_03_000106_0,
 scheduledTime=0, startTime=1423619705486, finishTime=1423620148368, 
timeTaken=442882, events=[[info={}, type=TASK_ATTEMPT_FINISHED, 
time=1423620148368], [info={}, type=TASK_ATTEMPT_STARTED, time=1423619705486]], 
diagnostics=, successfulAttempId=, 
container=[id=container_1421164610335_0820_01_000074, 
host=cn053-10.l42scl.hortonworks.com], nodeId=cn053-10.l42scl.hortonworks.com, 
logURL=http://cn042-10.l42scl.hortonworks.com:19888/jobhistory/logs/cn053-10.l42scl.hortonworks.com:43277/container_1421164610335_0820_01_000074/v...
{code}

> Tez framework to extract/analyze data stored in ATS for specific dag
> --------------------------------------------------------------------
>
>                 Key: TEZ-2076
>                 URL: https://issues.apache.org/jira/browse/TEZ-2076
>             Project: Apache Tez
>          Issue Type: Improvement
>            Reporter: Rajesh Balamohan
>            Assignee: Rajesh Balamohan
>         Attachments: TEZ-2076.WIP.2.patch, TEZ-2076.WIP.3.patch, 
> TEZ-2076.WIP.patch
>
>
> - Users should be able to download ATS data pertaining to a DAG from Tez-UI 
> (more like a zip file containing DAG/Vertex/Task/TaskAttempt info).
> - This can be plugged into an analyzer which parses the data, adds semantics 
> and provides an in-memory representation for further analysis.
> - This will make it possible to write different analyzer rules, which can be 
> run on top of this in-memory representation to come up with analysis on the DAG.
> - Results of these analyzer rules can be rendered in a UI (standalone webapp) 
> at a later point in time.



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

Reply via email to