[ 
https://issues.apache.org/jira/browse/SPARK-17877?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel
 ]

Alexander Pivovarov updated SPARK-17877:
----------------------------------------
    Description: 
The following code demonstrates the issue:
{code}
import org.apache.spark.graphx._
val users = sc.parallelize(List((3L, ("lucas", "student")), (7L, ("john", 
"postdoc")), (5L, ("matt", "prof")), (2L, ("kelly", "prof"))))
val rel = sc.parallelize(List(Edge(3L, 7L, "collab"), Edge(5L, 3L, "advisor"), 
Edge(2L, 5L, "colleague"), Edge(5L, 7L, "pi")))
sc.setCheckpointDir("/tmp/check")

val g = Graph(users, rel)
g.checkpoint

val gg = g.connectedComponents()
gg.checkpoint

gg.vertices.collect
gg.edges.collect
gg.isCheckpointed
// res5: Boolean = false
{code}
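I think the last line (gg.isCheckpointed) should return true instead of false, because gg.checkpoint was called before the collect actions that materialize the graph.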

  was:
The following code demonstrates an issue
{code}
import org.apache.spark.graphx._
val users = sc.parallelize(List((3L, ("lucas", "student")), (7L, ("john", 
"postdoc")), (5L, ("matt", "prof")), (2L, ("kelly", "prof"))))
val rel = sc.parallelize(List(Edge(3L, 7L, "collab"), Edge(5L, 3L, "advisor"), 
Edge(2L, 5L, "colleague"), Edge(5L, 7L, "pi")))
sc.setCheckpointDir("/tmp/check")

val g = Graph(users, rel)
g.checkpoint

val gg = g.connectedComponents()
gg.checkpoint

gg.vertices.collect
gg.edges.collect
gg.isCheckpointed
// res5: Boolean = false
{code}
I think the last line should return true instead of false


> Cannot checkpoint connectedComponents resulting graph
> -----------------------------------------------------
>
>                 Key: SPARK-17877
>                 URL: https://issues.apache.org/jira/browse/SPARK-17877
>             Project: Spark
>          Issue Type: Bug
>          Components: GraphX
>    Affects Versions: 1.5.2, 1.6.2, 2.0.1
>            Reporter: Alexander Pivovarov
>            Priority: Minor
>
> The following code demonstrates the issue:
> {code}
> import org.apache.spark.graphx._
> val users = sc.parallelize(List((3L, ("lucas", "student")), (7L, ("john", 
> "postdoc")), (5L, ("matt", "prof")), (2L, ("kelly", "prof"))))
> val rel = sc.parallelize(List(Edge(3L, 7L, "collab"), Edge(5L, 3L, 
> "advisor"), Edge(2L, 5L, "colleague"), Edge(5L, 7L, "pi")))
> sc.setCheckpointDir("/tmp/check")
> val g = Graph(users, rel)
> g.checkpoint
> val gg = g.connectedComponents()
> gg.checkpoint
> gg.vertices.collect
> gg.edges.collect
> gg.isCheckpointed
> // res5: Boolean = false
> {code}
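> I think the last line (gg.isCheckpointed) should return true instead of false, because gg.checkpoint was called before the collect actions that materialize the graph.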



--
This message was sent by Atlassian JIRA
(v6.3.4#6332)

---------------------------------------------------------------------
To unsubscribe, e-mail: issues-unsubscr...@spark.apache.org
For additional commands, e-mail: issues-h...@spark.apache.org

Reply via email to