[ https://issues.apache.org/jira/browse/GIRAPH-1188?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=16444798#comment-16444798 ]
ASF GitHub Bot commented on GIRAPH-1188: ---------------------------------------- Github user yukselakinci commented on a diff in the pull request: https://github.com/apache/giraph/pull/70#discussion_r182885119 --- Diff: giraph-core/src/main/java/org/apache/giraph/writable/kryo/GiraphClassResolver.java --- @@ -0,0 +1,308 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package org.apache.giraph.writable.kryo; +import com.esotericsoftware.kryo.Kryo; +import com.esotericsoftware.kryo.KryoException; +import com.esotericsoftware.kryo.Registration; +import com.esotericsoftware.kryo.io.Input; +import com.esotericsoftware.kryo.io.Output; +import com.esotericsoftware.kryo.util.DefaultClassResolver; +import com.esotericsoftware.kryo.util.ObjectMap; +import org.apache.giraph.zk.ZooKeeperExt; +import org.apache.zookeeper.CreateMode; +import org.apache.zookeeper.KeeperException; +import org.apache.zookeeper.ZooDefs; +import java.util.HashMap; +import java.util.Map; +import java.util.List; + +import static com.esotericsoftware.kryo.util.Util.getWrapperClass; + +/** + * This class resolver assigns unique classIds for every class that was not + * explicitly registered. 
It uses zookeeper for consistent mapping across all + * nodes. + */ +public class GiraphClassResolver extends DefaultClassResolver { + /** Length of the ZK sequence number */ + private static final int SEQUENCE_NUMBER_LENGTH = 10; + /** Base ID to start for class name assignments. + * This number has to be high enough to not conflict with + * explicity registered class IDs. + * */ + private static final int BASE_CLASS_ID = 10000; + + /** Class name to ID cache */ + private static Map<String, Integer> CLASS_NAME_TO_ID = new HashMap(); + /** ID to class name cache */ + private static Map<Integer, String> ID_TO_CLASS_NAME = new HashMap(); + /** Zookeeper */ + private static ZooKeeperExt ZK; + /** Zookeeper path for automatic class registrations */ + private static String KRYO_REGISTERED_CLASS_PATH; + /** Minimum class ID assigned by zookeeper sequencing */ + private static int MIN_CLASS_ID = -1; + + /** Memoized class id*/ + private int memoizedClassId = -1; + /** Memoized class registration */ + private Registration memoizedClassIdValue; + + /** + * Sets zookeeper informaton. + * @param zookeeperExt ZookeeperExt + * @param kryoClassPath Zookeeper directory path where class Name-ID + * mapping is stored. + */ + public static void setZookeeperInfo(ZooKeeperExt zookeeperExt, + String kryoClassPath) { + ZK = zookeeperExt; + KRYO_REGISTERED_CLASS_PATH = kryoClassPath; + } + + /** + * Creates a new node for the given class name. + * Creation mode is persistent sequential, i.e. + * ZK will always create a new node . There could be + * multiple entries for the same class name but since + * the lowest index is used, this is not a problem. 
+ * @param className Class name + */ + public static void createClassName(String className) { + try { + String path = KRYO_REGISTERED_CLASS_PATH + "/" + className; + ZK.createExt(path, + null, + ZooDefs.Ids.OPEN_ACL_UNSAFE, + CreateMode.PERSISTENT_SEQUENTIAL, + true); + } catch (KeeperException e) { + throw new IllegalStateException( + "Failed to create class " + className, e); + } catch (InterruptedException e) { + throw new IllegalStateException( + "Interrupted while creating " + className, e); + } + } + + /** + * Refreshes class-ID mapping from zookeeper. + * Not thread safe. + */ + public static void refreshCache() { + try { + ZK.createOnceExt(KRYO_REGISTERED_CLASS_PATH, + null, + ZooDefs.Ids.OPEN_ACL_UNSAFE, + CreateMode.PERSISTENT, + true); + } catch (KeeperException e) { + throw new IllegalStateException( + "Failed to refresh kryo cache " + + KRYO_REGISTERED_CLASS_PATH, e); + } catch (InterruptedException e) { + throw new IllegalStateException( + "Interrupted while refreshing kryo cache " + + KRYO_REGISTERED_CLASS_PATH, e); + } + + List<String> registeredList; + try { + registeredList = + ZK.getChildrenExt(KRYO_REGISTERED_CLASS_PATH, + false, + true, + false); + } catch (KeeperException e) { + throw new IllegalStateException( + "Failed to retrieve child nodes for " + KRYO_REGISTERED_CLASS_PATH, e); + } catch (InterruptedException e) { + throw new IllegalStateException( + "Interrupted while retrieving child nodes for " + + KRYO_REGISTERED_CLASS_PATH, e); + } + + for (String name : registeredList) { + String className = name.substring(0, --- End diff -- Done. > Add kryo custom class resolver for faster serialization. 
> -------------------------------------------------------- > > Key: GIRAPH-1188 > URL: https://issues.apache.org/jira/browse/GIRAPH-1188 > Project: Giraph > Issue Type: Improvement > Reporter: Yuksel Akinci > Priority: Major > > The custom class resolver allows kryo to always use the integer IDs for > classes that are agreed upon by all nodes running the job. The default class resolver > always writes the full class name of the first encountered class type to the > stream, and then it assigns an integer for subsequent instances. These > changes make the serialization faster by eliminating the need to write the > full name for the first encountered class instance. -- This message was sent by Atlassian JIRA (v7.6.3#76005)