Source code

Java tutorial


Here is the source code for net.sf.katta.zk.ZKClient


/**
 * Copyright 2008 the original author or authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package net.sf.katta.zk;

import java.util.Collections;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.CopyOnWriteArraySet;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.locks.Condition;
import java.util.concurrent.locks.ReentrantLock;

import net.sf.katta.util.KattaException;
import net.sf.katta.util.ZkConfiguration;

import org.apache.log4j.Logger;
import org.apache.zookeeper.CreateMode;
import org.apache.zookeeper.KeeperException;
import org.apache.zookeeper.WatchedEvent;
import org.apache.zookeeper.Watcher;
import org.apache.zookeeper.ZooKeeper;
import org.apache.zookeeper.Watcher.Event.KeeperState;
import org.apache.zookeeper.ZooDefs.Ids;

/**
 * Abstracts the interaction with ZooKeeper and allows permanent (not just
 * one-time) watches on nodes in ZooKeeper.
 */
public class ZKClient implements Watcher {

    // Class-wide log4j logger.
    private final static Logger LOG = Logger.getLogger(ZKClient.class);

    // Upper bound on the attempts made by the retry loops in createOne(), exists() and getChildren().
    private static final int MAX_RETRIES = 5;

    // Supplies the root path, the path separator and the well-known katta paths.
    private ZkConfiguration _conf;
    // ZooKeeper handle: assigned in start(), reset to null in close() and on a failed start().
    private ZooKeeper _zk = null;
    // Lock returned by getEventLock(); start() waits on its state-changed condition.
    private final ZkLock _zkEventLock = new ZkLock();

    // Listener registries keyed by node path; the add*Listener helpers create the per-path sets.
    private final Map<String, Set<IZkChildListener>> _path2ChildListenersMap = new ConcurrentHashMap<String, Set<IZkChildListener>>();
    private final Map<String, Set<IZkDataListener>> _path2DataListenersMap = new ConcurrentHashMap<String, Set<IZkDataListener>>();
    // Listeners iterated by reconnect() after the client has been restarted.
    private final Set<IZkReconnectListener> _reconnectListener = new CopyOnWriteArraySet<IZkReconnectListener>();

    // Connection settings captured by the constructors.
    private final String _servers;
    private final int _port;
    private final int _timeOut;
    // Set by close(), cleared by start(); read by ensureZkRunning(), process() and processExpiration().
    private boolean _shutdownTriggered;

    /**
     * Creates a client from explicit connection settings; everything else comes
     * from a default-constructed {@link ZkConfiguration}.
     *
     * @param servers
     *          server string later handed to the ZooKeeper constructor in start()
     * @param port
     *          port reported by getPort()
     * @param timeout
     *          timeout later handed to the ZooKeeper constructor in start()
     */
    public ZKClient(String servers, int port, int timeout) {
        _conf = new ZkConfiguration();
        _servers = servers;
        _port = port;
        _timeOut = timeout;

    /**
     * Creates a client whose server string, client port and timeout are read
     * from the given configuration.
     *
     * @param configuration
     *          configuration kept for later path and separator lookups
     */
    public ZKClient(final ZkConfiguration configuration) {
        _conf = configuration;
        _servers = configuration.getZKServers();
        _port = configuration.getZKClientPort();
        _timeOut = configuration.getZKTimeOut();

    /**
     * @return true while this client holds a ZooKeeper handle, i.e. the
     *         internal handle is not null
     */
    public boolean isStarted() {
        return _zk != null;

    /**
     * Starts a zookeeper client and waits until it is connected with one of the
     * zookeeper servers.
     *
     * @param maxMsToWaitUntilConnected
     *          the milliseconds a method call will wait until the zookeeper
     *          client is connected with the server
     * @throws KattaException
     *           if the zookeeper client cannot be created or is still
     *           connecting after the given time
     */
    public void start(final long maxMsToWaitUntilConnected) throws KattaException {
        if (!_conf.getZKRootPath().equals(ZkConfiguration.DEFAULT_ROOT_PATH)) {
            // NOTE(review): the call that opens this argument list (presumably a log statement) is missing from this listing.
  "Using Katta root path: " + _conf.getZKRootPath());
        // A handle that already exists means start() was called twice.
        if (_zk != null) {
            throw new IllegalStateException("zk client has already been started");

        try {
            _shutdownTriggered = false;
            // Reference point for the connect timeout checked in the loop below.
            final long startTime = System.currentTimeMillis();
            try {
                // 'this' is passed as the watcher, so events are delivered to process().
                _zk = new ZooKeeper(_servers, _timeOut, this);
            } catch (final Exception e) {
                _zk = null;
                throw new KattaException("Could not start zookeeper service", e);

            // wait until connected
            try {
                while (_zk.getState() == ZooKeeper.States.CONNECTING) {
                    ZooKeeper.States state = _zk.getState();
                    if (System.currentTimeMillis() - startTime > maxMsToWaitUntilConnected) {
                        // Give up and forget the handle so that a later start() is not rejected.
                        // NOTE(review): the handle is dropped without being closed — confirm this is intended.
                        _zk = null;
                        throw new KattaException(
                                "No connected with zookeeper server yet. Current state is " + state);
                    LOG.debug("Zookeeper ZkServer not yet available, sleeping...");
                    // Wait at most one second for a state-change signal, then poll the state again.
                    getEventLock().getStateChangedCondition().await(1000, TimeUnit.MILLISECONDS);
                    // Thread.sleep(1000);

                // createDefaultNameSpace();
            } catch (final InterruptedException e) {
                // The interruption is only logged; the method then returns normally.
                LOG.warn("waiting for the zookeeper server was interrupted", e);
        } finally {
            // NOTE(review): no statement is visible in this finally block. Condition.await() needs the
            // owning lock to be held, so lock()/unlock() calls on the event lock were presumably here — confirm.

    /**
     * Closes down the connection to zookeeper. This will remove all ephemeral
     * nodes within zookeeper this client created.
     */
    public void close() {
        try {
            // Raise the flag first; process() and processExpiration() check it before acting on events.
            _shutdownTriggered = true;
            if (_zk != null) {
                // NOTE(review): only the reset of the handle is visible; the InterruptedException handler
                // below suggests a close call on the handle preceded it — confirm against the original.
                _zk = null;
        } catch (final InterruptedException e) {
            // NOTE(review): 'e' is not chained as the cause and the interrupt flag is not restored.
            throw new RuntimeException("unable to close zookeeper");
        } finally {

    /**
     * Guard for operations that need a live client.
     *
     * @throws IllegalStateException
     *           if close() has been triggered or no ZooKeeper handle exists yet
     */
    private void ensureZkRunning() {
        try {
            // Checked first: a closing client is reported as closing even though its handle is null too.
            if (_shutdownTriggered) {
                throw new IllegalStateException("zk client is already closing");
            if (_zk == null) {
                throw new IllegalStateException("zk client has not been started yet");
        } finally {
            // NOTE(review): the content of this finally block is missing from the listing.

    /**
     * Returns a mutex all zookeeper events are synchronized against. So in case
     * you need to do something without getting any zookeeper event interruption,
     * synchronize against this mutex. Also all threads waiting on this mutex
     * object will be notified on an event.
     */
    public ZkLock getEventLock() {
        // Always the same instance: the field is final and initialised with the client.
        return _zkEventLock;

    /**
     * Subscribes an {@link IZkChildListener} for permanent notifications about
     * children changes (adds and removes) of the given path.
     *
     * @param path
     *          the path whose children are observed
     * @param listener
     *          the listener to notify
     * @return list of children nodes for given path.
     * @throws KattaException
     *           Thrown in case we can't read the children nodes. Note that we
     *           also remove the notification listener.
     */
    public List<String> subscribeChildChanges(final String path, final IZkChildListener listener)
            throws KattaException {
        // Register first so the listener is in place before the watch is set.
        addChildListener(path, listener);
        try {
            // Reading the children with the watch flag set leaves a watch on the path.
            return getChildren(path, true);
        } catch (final Exception e) {
            // Undo the registration made above before reporting the failure.
            removeChildListener(path, listener);
            throw new KattaException("unable to subscribe child changes for path: " + path, e);

    /**
     * Ends a child-change subscription by handing the listener to
     * removeChildListener for the given path.
     *
     * @param path
     *          the path the listener was subscribed to
     * @param childListener
     *          the listener to remove
     */
    public void unsubscribeChildChanges(String path, IZkChildListener childListener) {
        removeChildListener(path, childListener);

    /**
     * Ends a data-change subscription by handing the listener to
     * removeDataListener for the given path.
     *
     * @param path
     *          the path the listener was subscribed to
     * @param dataListener
     *          the listener to remove
     */
    public void unsubscribeDataChanges(String path, IZkDataListener<?> dataListener) {
        removeDataListener(path, dataListener);

    /**
     * Subscribes a listener for reconnects of this client.
     * NOTE(review): the body is missing from this listing; presumably the
     * listener is added to the set that reconnect() iterates — confirm.
     *
     * @param listener
     *          the listener to register
     */
    public void subscribeReconnects(final IZkReconnectListener listener) {

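    /**
     * Subscribes the given listener for permanent notifications about data
     * changes on the given node path.
     *
     * @param path
     *          the path of the node to observe
     * @param listener
     *          the listener to notify
     * @throws KattaException
     *           if the watch on the node cannot be set
     */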
    public void subscribeDataChanges(final String path, final IZkDataListener listener) throws KattaException {
        // Register first so the listener is in place before the watch is set.
        addDataListener(path, listener);
        try {
            // The returned bytes are discarded; the read is made only to leave a watch on the node.
            _zk.getData(path, true, null);
        } catch (final Exception e) {
            // Undo the registration made above before reporting the failure.
            removeDataListener(path, listener);
            throw new KattaException("Unable to subscribe data changes for path: " + path, e);

    /**
     * Unsubscribes all listeners from zk events.
     */
    public void unsubscribeAll() {
        // NOTE(review): the body is missing from this listing; presumably it clears the listener registries — confirm.

    /**
     * Looks up the data listeners registered for the path so that the given one
     * can be removed; a path without registered listeners is left untouched.
     */
    private void removeDataListener(final String path, final IZkDataListener listener) {
        final Set<IZkDataListener> listeners = _path2DataListenersMap.get(path);
        if (listeners != null) {
            // NOTE(review): the statement inside this check is missing from the listing; presumably it removes 'listener' from the set.

    /**
     * Looks up the child listeners registered for the path so that the given one
     * can be removed; a path without registered listeners is left untouched.
     */
    private void removeChildListener(final String path, final IZkChildListener listener) {
        final Set<IZkChildListener> listeners = _path2ChildListenersMap.get(path);
        if (listeners != null) {
            // NOTE(review): the statement inside this check is missing from the listing; presumably it removes 'listener' from the set.

    /**
     * Makes sure a listener set exists for the path in the child-listener
     * registry, creating it on first use.
     */
    private void addChildListener(final String path, final IZkChildListener listener) {
        Set<IZkChildListener> listeners;
        // Hold the map's monitor so the lookup and the creation of the per-path set are one step.
        synchronized (_path2ChildListenersMap) {
            listeners = _path2ChildListenersMap.get(path);
            if (listeners == null) {
                // First listener for this path: create and publish its set.
                listeners = new CopyOnWriteArraySet<IZkChildListener>();
                _path2ChildListenersMap.put(path, listeners);
                // NOTE(review): the statement adding 'listener' to the set is missing from this listing.

    /**
     * Makes sure a listener set exists for the path in the data-listener
     * registry, creating it on first use.
     */
    private void addDataListener(final String path, final IZkDataListener listener) {
        Set<IZkDataListener> listeners;
        // Hold the map's monitor so the lookup and the creation of the per-path set are one step.
        synchronized (_path2DataListenersMap) {
            listeners = _path2DataListenersMap.get(path);
            if (listeners == null) {
                // First listener for this path: create and publish its set.
                listeners = new CopyOnWriteArraySet<IZkDataListener>();
                _path2DataListenersMap.put(path, listeners);
                // NOTE(review): the statement adding 'listener' to the set is missing from this listing.

    /**
     * Creates a node for the given path without any data.
     *
     * @param path
     *          the path of the node to create
     * @throws KattaException
     *           if the node cannot be created
     */
    public void create(final String path) throws KattaException {
        // No payload, persistent node; the path returned by the private overload is discarded.
        create(path, null, CreateMode.PERSISTENT);

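    /**
     * Creates a node for the given path with the given {@link Writable} data.
     *
     * @param path
     *          the path of the node to create
     * @param writable
     *          the data to store in the node
     * @throws KattaException
     *           if the node cannot be created
     */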
    public void create(final String path, final Writable writable) throws KattaException {
        // Persistent node; the path returned by the private overload is discarded.
        create(path, writable, CreateMode.PERSISTENT);

    /**
     * Creates the node for the given path, first creating every missing parent
     * node as an empty persistent node.
     *
     * @param path
     *          the full path of the node to create; must not be null
     * @param writable
     *          the data for the leaf node, or null for none
     * @param mode
     *          the create mode of the leaf node only
     * @return the value returned by createOne for the leaf node
     * @throws KattaException
     *           wrapping any exception raised while creating the nodes
     */
    private String create(final String path, final Writable writable, CreateMode mode) throws KattaException {
        assert path != null;
        final byte[] data = writableToByteArray(writable);
        char sep = _conf.getSeparator();
        try {
            // First create elements on path down to leaf node (if missing).
            // NOTE(review): String.split treats its argument as a regular expression; a separator that is
            // a regex metacharacter would need quoting — confirm the configured separator is safe.
            String[] elements = path.split(new String(new char[] { sep }));
            String dirPath = "";
            // The last element is the leaf and is handled after the loop.
            for (int i = 0; i < elements.length - 1; i++) {
                // Empty elements arise from a leading or doubled separator.
                // NOTE(review): the body of this check is missing from the listing.
                if (elements[i].length() == 0) {
                dirPath += sep + elements[i];
                if (!exists(dirPath)) {
                    // Parents are always persistent and carry no data, whatever 'mode' is.
                    createOne(dirPath, new byte[0], CreateMode.PERSISTENT);
            // Now create leaf.
            return createOne(path, data, mode);
        } catch (final Exception e) {
            throw new KattaException("Unable to create path '" + path + "' in ZK", e);

    /**
     * Creates a single node with the open ACL, making at most MAX_RETRIES
     * attempts.
     *
     * @param path
     *          the path of the node to create
     * @param bytes
     *          the data to store in the node
     * @param mode
     *          the create mode of the node
     * @return the path reported by ZooKeeper, or the requested path if the node
     *         already existed
     * @throws KattaException
     *           on any other KeeperException or when all attempts are used up
     */
    private String createOne(final String path, final byte[] bytes, CreateMode mode) throws KattaException {
        // Remembers that a connection loss was logged, so the eventual success is logged as well.
        boolean warned = false;
        for (int t = 0; t < MAX_RETRIES; t++) {
            try {
                String s = _zk.create(path, bytes, Ids.OPEN_ACL_UNSAFE, mode);
                if (warned) {
                    LOG.warn(String.format("Created intermediate node: %s", path));
                return s;
            } catch (KeeperException.NodeExistsException e) {
                // Some one must have created it just now.
                return path;
            } catch (InterruptedException e) {
                // Ignore. Try again.
                // NOTE(review): the interrupt flag is not restored here.
            } catch (KeeperException.ConnectionLossException e) {
                // NOTE(review): the call that opens this argument list (presumably a log statement) is missing from this listing.
                        "KeeperException.ConnectionLossException during attempt %d of %d to create intermediate node: %s",
                        t + 1, MAX_RETRIES, path));
                warned = true;
                // Should try again after a very short time.
                try {
                    // NOTE(review): the body of this try (presumably a short sleep) is missing from this listing.
                } catch (InterruptedException ie) {
                    // Ignore.
            } catch (KeeperException e) {
                LOG.error(String.format("Error creating intermediate node: %s", path), e);
                throw new KattaException(String.format("Unable to create intermediate node: %s", path), e);
        // Reached only when every attempt ended in a connection loss or an interruption.
        throw new KattaException("Unable to create intermediate node: " + path);

    /**
     * Converts the given writable into the byte array stored in a node.
     *
     * @param writable
     *          the object to serialize, may be null
     * @return the buffer contents, or an empty array when writable is null
     * @throws KattaException
     *           wrapping an IOException raised during serialization
     */
    private byte[] writableToByteArray(final Writable writable) throws KattaException {
        // Default for a null writable: an empty array rather than null.
        byte[] data = new byte[0];
        if (writable != null) {
            final DataOutputBuffer out = new DataOutputBuffer();
            try {
                // NOTE(review): the statement writing 'writable' into 'out' is missing from this listing.
            } catch (final IOException e) {
                throw new KattaException("unable to serialize writable", e);
            // NOTE(review): if DataOutputBuffer is Hadoop's, getData() returns the whole backing array,
            // which can be longer than the bytes actually written (getLength()) — confirm.
            data = out.getData();
        return data;

    /**
     * Creates an ephemeral node for the given path. In case the client that
     * created that node disconnects, the node is removed.
     *
     * @param path
     *          the path of the node to create
     * @throws KattaException
     *           if the node cannot be created
     */
    public void createEphemeral(final String path) throws KattaException {
        // No payload; only the leaf is ephemeral, missing parents are created persistent by create().
        create(path, null, CreateMode.EPHEMERAL);

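    /**
     * Creates an ephemeral node with the given data of the writable.
     *
     * @param path
     *          the path of the node to create
     * @param writable
     *          the data to store in the node
     * @throws KattaException
     *           if the node cannot be created
     */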
    public void createEphemeral(final String path, final Writable writable) throws KattaException {
        // Only the leaf is ephemeral; missing parents are created persistent by create().
        create(path, writable, CreateMode.EPHEMERAL);

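    /**
     * Deletes a given path. For recursive deletes use
     * {@link #deleteRecursive(String)}.
     *
     * @param path
     *          the path of the node to delete
     * @return true when the call completes without an exception
     * @throws KattaException
     *           if the node cannot be deleted, e.g. because it has sub nodes
     */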
    public boolean delete(final String path) throws KattaException {
        try {
            // Without a handle nothing is deleted.
            if (_zk != null) {
                // Version -1 is ZooKeeper's wildcard: delete whatever version the node has.
                _zk.delete(path, -1);
            return true;
        } catch (final KeeperException e) {
            String message = "unable to delete path: " + path;
            // Make the most likely cause explicit: the node still has children.
            if (KeeperException.Code.NOTEMPTY == e.code()) {
                message += " Path has sub nodes.";
            throw new KattaException(message, e);
        } catch (final Exception e) {
            throw new KattaException("unable to delete path:" + path, e);

    /**
     * Acts on the given path only when exists(path) reports a node there.
     * NOTE(review): the statement inside the check is missing from this
     * listing; per the method name it presumably deletes the path — confirm.
     *
     * @param path
     *          the path to check
     * @throws KattaException
     *           if the existence check fails
     */
    public void deleteIfExists(String path) throws KattaException {
        if (exists(path)) {

    /**
     * Deletes a path and all children recursively.
     *
     * @param path
     *          The path to delete.
     * @return true if successful.
     * @throws KattaException
     *           if a node cannot be deleted or reading the children is
     *           interrupted
     */
    public boolean deleteRecursive(final String path) throws KattaException {
        try {
            // Children go first: the node itself is deleted only after its subtree.
            final List<String> children = _zk.getChildren(path, false);
            for (final String child : children) {
                // Avoid a doubled separator when the parent path already ends with "/".
                String subPath = path + (path.endsWith("/") ? "" : _conf.getSeparator()) + child;
                if (!deleteRecursive(subPath)) {
                    return false;
        } catch (final KeeperException e) {
            // do nothing since we simply do not have children here.
        } catch (final InterruptedException e) {
            throw new KattaException("retrieving children was interruppted", e);

        // The root and the "/zookeeper" subtree are never deleted; they are reported as success.
        if (path.equals("/") || path.equals("/zookeeper") || path.startsWith("/zookeeper/")) {
            // Special case when root path = /. Can't delete these.
            return true;
        try {
            _zk.delete(path, -1);
        } catch (final KeeperException e) {
            // A node that is already gone counts as deleted; every other code is an error.
            if (e.code() != KeeperException.Code.NONODE) {
                throw new KattaException("unable to delete:" + path, e);
        } catch (final Exception e) {
            throw new KattaException("unable to delete:" + path, e);
        return true;

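    /**
     * Checks if a node with the given path exists.
     *
     * @param path
     *          the path to check
     * @return true if a node exists at the given path
     * @throws KattaException
     *           if the check fails or all retries are used up
     */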
    public boolean exists(final String path) throws KattaException {
        // Remembers that a connection loss was logged, so the eventual result is logged as well.
        boolean warned = false;
        for (int i = 0; i < MAX_RETRIES; i++) {
            try {
                try {
                    // No watch is left by this check.
                    boolean exists = _zk.exists(path, false) != null;
                    if (warned) {
                        LOG.warn(String.format("Path %s %s", path, exists ? "exists" : "does not exist"));
                    return exists;
                } catch (KeeperException.ConnectionLossException e) {
                    // NOTE(review): the call that opens this argument list (presumably a log statement) is missing from this listing.
                            "KeeperException.ConnectionLossException during attempt %d of %d to check node: %s for existence",
                            i + 1, MAX_RETRIES, path));
                    warned = true;
                    // should try again after a very short time
                } catch (KeeperException e) {
                    throw new KattaException(String.format("Unable to check path: %s", path), e);
            } catch (InterruptedException e1) {
                // ignore this since it just made us wake up a little early
        // Reached only when every attempt ended in a connection loss or an interruption.
        throw new KattaException(String.format("Unable to check path %s after %d retries", path, MAX_RETRIES));

    /**
     * Returns the creation time of the node at the given path.
     *
     * @param path
     *          the path of the node
     * @return the ctime from the node's stat, or -1 if no node exists at the path
     * @throws KattaException
     *           wrapping any exception raised by the lookup
     */
    public long getCreateTime(final String path) throws KattaException {
        try {
            // A null stat means there is no node at the path.
            Stat stat = _zk.exists(path, false);
            if (stat != null) {
                return stat.getCtime();
            } else {
                return -1;
        } catch (final Exception e) {
            throw new KattaException("unable to get create time: " + path, e);

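    /**
     * Returns a list of all children names of the given path.
     *
     * @param path
     *          the path of the parent node
     * @return the names of the children
     * @throws KattaException
     *           if the children cannot be retrieved
     */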
    public List<String> getChildren(final String path) throws KattaException {
        boolean watch = false;
        final Set<IZkChildListener> listeners = _path2ChildListenersMap.get(path);
        if (listeners != null && listeners.size() > 0) {
            watch = true;
        return getChildren(path, watch);

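    /**
     * Helper method that reads the children of a path and retries on
     * connection loss, so that callers do not see connection-loss exceptions.
     *
     * @param path
     *          the path of the parent node
     * @param isToLeaveWatch
     *          whether a watch is left on the path
     * @return the names of the children
     * @throws KattaException
     *           if the children cannot be retrieved
     */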
    private List<String> getChildren(final String path, boolean isToLeaveWatch) throws KattaException {
        // Remembers that a connection loss was logged, so the eventual success is logged as well.
        boolean warned = false;
        for (int i = 0; i < MAX_RETRIES; i++) {
            try {
                List<String> children = _zk.getChildren(path, isToLeaveWatch);
                if (warned) {
                    LOG.warn("Got children for path: " + path);
                return children;
            } catch (KeeperException.ConnectionLossException e) {
                // NOTE(review): the call that opens this argument list (presumably a log statement) is missing from this listing.
                        "Lost connection to ZK while trying to get children of: %s. Attempt %d of %d. Reconnecting.",
                        path, i + 1, MAX_RETRIES), e);
                warned = true;
                try {
                    // NOTE(review): the body of this try (presumably a short wait) is missing from this listing.
                } catch (InterruptedException e1) {
                    // Ignore this one.
            } catch (InterruptedException e1) {
                // Ignore this since it just made us wake up a little early .
            } catch (final Exception e) {
                // Anything else is not retried.
                throw new KattaException("Warning: unable to retrieve children: " + path, e);
        // Reached only when every attempt ended in a connection loss or an interruption.
        throw new KattaException("Warning: unable to retrieve children: " + path);

    public int countChildren(String path) throws KattaException {
        int childCount = 0;
        if (exists(path)) {
            childCount = getChildren(path).size();
        return childCount;

    /**
     * Watcher callback; this client passes itself as the watcher when it
     * creates the ZooKeeper handle in start().
     *
     * @param event
     *          the event delivered by ZooKeeper
     */
    public void process(WatchedEvent event) {

        // public void process(final WatcherEvent event) {
        // if (null == event.getPath()) {
        // // prohibit nullpointer (See ZOOKEEPER-77)
        // event.setPath("null");
        // }
        // Only Disconnected and Expired count as a state change here.
        boolean stateChanged = event.getState() == KeeperState.Disconnected
                || event.getState() == KeeperState.Expired;
        // NOTE(review): NodeCreated is not part of this test although processDataOrChildChange
        // has a branch for it — confirm whether that branch can be reached.
        boolean dataChanged = event.getType() == Watcher.Event.EventType.NodeDataChanged
                || event.getType() == Watcher.Event.EventType.NodeChildrenChanged
                || event.getType() == Watcher.Event.EventType.NodeDeleted;
        try {
            if (_shutdownTriggered) {
                LOG.debug("ignoring event '{" + event.getType() + " | " + event.getPath()
                        + "}' since shutdown triggered");
            // NOTE(review): the bodies of the following checks are missing from this listing; presumably
            // they dispatch to processExpiration and processDataOrChildChange.
            if (event.getState() == KeeperState.Expired) {
            if (dataChanged) {
        } finally {
            // NOTE(review): bodies missing here as well; presumably the matching conditions of the
            // event lock are signalled.
            if (stateChanged) {
            if (dataChanged) {

    /**
     * Handles an expired session: logs it and, unless a shutdown is in progress,
     * announces a reconnect.
     *
     * @param event
     *          the expiration event, used for logging
     */
    private void processExpiration(WatchedEvent event) {
        // we do a reconnect
        LOG.warn("Zookeeper session expired (" + event + ")");
        if (_shutdownTriggered) {
            // already closing
        } else {
            LOG.warn("Reconnecting to Zookeeper");
            // NOTE(review): the statements performing the reconnect are missing from this listing.

    /**
     * Re-establishes the watch for the event's path and notifies the listeners
     * registered for it: child listeners for NodeChildrenChanged, data listeners
     * for every other event type.
     *
     * @param event
     *          the data or child change event
     */
    private void processDataOrChildChange(WatchedEvent event) {
        // ZkEventType eventType = ZkEventType.getMappedType(event.getType());
        final String path = event.getPath();

        if (event.getType() == Watcher.Event.EventType.NodeChildrenChanged) {
            Set<IZkChildListener> childListeners = _path2ChildListenersMap.get(path);
            if (childListeners != null && !childListeners.isEmpty()) {
                // Since resubscribeChildPath might remove listeners from the set
                // when it fails, the listeners are copied first so that those we
                // could not re-subscribe to the given path are notified as well.
                HashSet<IZkChildListener> copiedSet = new HashSet<IZkChildListener>();
                // NOTE(review): the statement filling copiedSet is missing from this listing.

                List<String> children = resubscribeChildPath(path, childListeners);

                for (final IZkChildListener listener : copiedSet) {
                    try {
                        listener.handleChildChange(event.getPath(), children);
                    } catch (final Throwable e) {
                        // One failing listener must not stop the others from being notified.
                        LOG.error("Faild to process event with listener: " + listener, e);
        } else {
            Set<IZkDataListener> listeners = _path2DataListenersMap.get(path);
            if (listeners != null && !listeners.isEmpty()) {

                HashSet<IZkDataListener> copiedSet = new HashSet<IZkDataListener>();
                // NOTE(review): the statement filling copiedSet is missing from this listing.
                // 'data' is null when the re-subscription failed.
                byte[] data = resubscribeDataPath(path, listeners);

                for (final IZkDataListener listener : copiedSet) {
                    try {
                        // NOTE(review): the listener calls that open the argument lists below, and the
                        // body of the NodeDeleted branch, are missing from this listing.
                        if (event.getType() == Watcher.Event.EventType.NodeCreated) {
                                    readWritable(listener.createWritable(), data));
                        } else if (event.getType() == Watcher.Event.EventType.NodeDataChanged) {
                                    readWritable(listener.createWritable(), data));
                        } else if (event.getType() == Watcher.Event.EventType.NodeDeleted) {
                        } else {
                            LOG.error("Received a unknown event, ignoring: " + event.getType());
                    } catch (final Throwable e) {
                        // One failing listener must not stop the others from being notified.
                        LOG.error("Faild to process event " + event.getType() + " with listener: " + listener, e);

    /**
     * Reads the data of the path with the watch flag set, which renews the watch.
     * When the read fails, every given listener is handed to removeDataListener.
     *
     * @param path
     *          the path of the node
     * @param listeners
     *          the listeners currently registered for the path
     * @return the node data, or null when the read failed
     */
    private byte[] resubscribeDataPath(final String path, final Set<IZkDataListener> listeners) {
        byte[] data = null;
        try {
            data = _zk.getData(path, true, null);
        } catch (final Exception e) {
            for (final IZkDataListener listener : listeners) {
                removeDataListener(path, listener);
            LOG.fatal("resubscription for data changes on path '" + path + "' failed. removing listeners", e);
        // NOTE(review): callers pass this value to readWritable, which reads data.length — a null
        // result would raise a NullPointerException there.
        return data;

    /**
     * Reads the children of the path with the watch flag set, which renews the
     * watch.
     *
     * @param path
     *          the path of the parent node
     * @param childListeners
     *          the listeners currently registered for the path; not modified by
     *          the visible code
     * @return the children, or an empty list when the read failed
     */
    private List<String> resubscribeChildPath(final String path, final Set<IZkChildListener> childListeners) {
        List<String> children;
        try {
            children = getChildren(path, true);
        } catch (final Exception e) {
            // NOTE(review): the message announces that listeners are removed, but the removal below is commented out.
            LOG.fatal("re-subscription for child changes on path '" + path + "' failed. removing listeners", e);
            children = Collections.emptyList();
            // childListeners.clear();
        return children;

    /**
     * Restarts the client, waiting up to ten minutes for the connection, and
     * then goes through the registered reconnect listeners.
     *
     * @throws RuntimeException
     *           wrapping anything thrown during the restart
     */
    private void reconnect() {
        try {
            // NOTE(review): start() rejects a client whose handle is still set, so a statement closing
            // the old handle presumably preceded this call — it is missing from this listing.
            start(1000 * 60 * 10);
            for (IZkReconnectListener reconnectListener : _reconnectListener) {
                // NOTE(review): the loop body (presumably the listener callback) is missing from this listing.
        } catch (final Throwable t) {
            throw new RuntimeException("Exception while restarting zk client", t);

    /**
     * Reads the data of the given path into a writable instance. Make sure you
     * use the same writable implementation as you used to write the data.
     *
     * @param path
     *          the path of the node to read
     * @param writable
     *          the instance the data is read into
     * @throws KattaException
     *           if the data cannot be read
     */
    public void readData(final String path, final Writable writable) throws KattaException {
        byte[] data;
        // Leave a watch on the node only when at least one data listener is registered for the path.
        boolean watch = false;
        final Set<IZkDataListener> set = _path2DataListenersMap.get(path);
        if (set != null && set.size() > 0) {
            watch = true;
        try {
            data = _zk.getData(path, watch, null);
        } catch (final Exception e) {
            throw new KattaException("Failed to read data for: " + path, e);
        // Fill the caller's instance from the bytes that were read.
        readWritable(writable, data);

    public <T extends Writable> T readData(final String path, final Class<T> writableClass) throws KattaException {
        T newInstance;
        try {
            newInstance = writableClass.newInstance();
        } catch (Exception e) {
            throw new RuntimeException("could not create instance of " + writableClass.getName(), e);
        readData(path, newInstance);
        return newInstance;

    /**
     * Fills the given writable from the given bytes via a DataInputBuffer.
     *
     * @param writable
     *          the instance to fill
     * @param data
     *          the serialized bytes; a null value fails on data.length
     * @return the writable that was passed in
     * @throws KattaException
     *           wrapping an IOException raised while reading
     */
    private Writable readWritable(final Writable writable, byte[] data) throws KattaException {
        final DataInputBuffer buffer = new DataInputBuffer();
        buffer.reset(data, data.length);
        try {
            // NOTE(review): the statement reading the fields of 'writable' from 'buffer' is missing from this listing.
        } catch (final IOException e) {
            throw new KattaException("unable to read data into Writable", e);
        } finally {
            try {
                // NOTE(review): the statement closing 'buffer' is missing from this listing.
            } catch (IOException e) {
                // A failed close is only logged; the data has been read at this point.
                LOG.warn("could not close data buffer", e);
        return writable;

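    /**
     * Shows the full node structure of the Zookeeper server. Useful for
     * debugging.
     *
     * @param all
     *          true to start at the root, false to start at the katta root path
     * @param output
     *          the stream the structure is written to
     * @throws KattaException
     *           if the children of a node cannot be retrieved
     */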
    public void showFolders(boolean all, OutputStream output) throws KattaException {
        // Depth handed to addChildren for the first level of children.
        final int level = 1;
        final StringBuilder builder = new StringBuilder();
        // 'all' starts the listing at the bare separator, otherwise at the configured katta root path.
        final String startPath = all ? new String(new char[] { _conf.getSeparator() }) : _conf.getZKRootPath();
        builder.append(startPath + "\n");
        addChildren(level, builder, startPath);
        try {
            // NOTE(review): the statement writing the built text to 'output' is missing from this listing.
        } catch (final IOException e) {
            // NOTE(review): the handling of the IOException is missing from this listing.

    /**
     * Appends one line per child of startPath to the builder and recurses into
     * each child with the next indentation level.
     *
     * @param level
     *          the depth of the children being listed, starting at 1
     * @param builder
     *          the builder the tree lines are appended to
     * @param startPath
     *          the path whose children are listed
     * @throws KattaException
     *           if the children of a child node cannot be retrieved
     */
    private void addChildren(final int level, final StringBuilder builder, final String startPath)
            throws KattaException {
        // Falls back to "no children" when the lookup for startPath itself fails.
        List<String> children = Collections.emptyList();
        try {
            children = getChildren(startPath);
        } catch (KattaException e) {
            // NOTE(review): nothing is visible in this handler; the failure appears to be ignored deliberately.
        for (final String node : children) {
            String childPath = startPath + (startPath.endsWith("/") ? "" : "/") + node;
            // '+' marks a node that has children of its own, '-' marks a leaf.
            boolean hasKids = !getChildren(childPath).isEmpty();
            char connector = hasKids ? '+' : '-';
            builder.append(getSpaces(level - 1) + "'-" + connector + node + "\n");

            // Same path as childPath, built by collapsing a doubled slash instead.
            addChildren(level + 1, builder, (startPath + "/" + node).replaceAll("//", "/"));

    private String getSpaces(final int level) {
        String s = "";
        for (int i = 0; i < level; i++) {
            s += "  ";
        return s;

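    /**
     * Writes the data of the given writable to the node at the given path.
     *
     * @param path
     *          the path of the node to write to
     * @param writable
     *          the data to store in the node
     * @throws KattaException
     *           if the data cannot be written
     */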
    public void writeData(final String path, final Writable writable) throws KattaException {
        final byte[] data = writableToByteArray(writable);
        try {
            // Version -1 is ZooKeeper's wildcard: overwrite whatever version the node has.
            _zk.setData(path, data, -1);
        } catch (final Exception e) {
            throw new KattaException("Unable to write data for: " + path, e);

    /**
     * @return the port this client was constructed with
     */
    public int getPort() {
        return _port;

    public ZooKeeper.States getZookeeperState() {
        return _zk != null ? _zk.getState() : null;

    // **************************************************
    // ********** katta specific methods
    // **************************************************

    /**
     * Creates the default folder structure for katta within zookeeper.
     *
     * @throws KattaException
     *           if a folder cannot be created for a reason other than that it
     *           already exists
     */
    public void createDefaultNameSpace() throws KattaException {
        LOG.debug("Creating default File structure if required....");
        try {
            // One existence check per well-known katta path.
            // NOTE(review): the body of each check (presumably the create call for that path) is missing from this listing.
            if (!exists(_conf.getZKRootPath())) {
            if (!exists(_conf.getZKIndicesPath())) {
            if (!exists(_conf.getZKNodesPath())) {
            if (!exists(_conf.getZKNodeToShardPath())) {
            if (!exists(_conf.getZKShardToNodePath())) {
            if (!exists(_conf.getZKShardToErrorPath())) {
            if (!exists(_conf.getZKLoadTestPath())) {
        } catch (KattaException e) {
            // A "node exists" failure is recognised by its message text and tolerated.
            if (e.getCause() instanceof KeeperException
                    && e.getCause().getMessage().contains("KeeperErrorCode = NodeExists")) {
                // if components starting concurrently the exists is not safe
                LOG.debug("could not create default namespace " + e.getCause().getMessage());
            } else {
                throw e;

    /**
     * @return all nodes known to the system, including those that are
     *         currently disconnected
     */
    public List<String> getKnownNodes() throws KattaException {
        // The node names are the children of the configured node-to-shard path.
        return getChildren(_conf.getZKNodeToShardPath());

    /**
     * @return all nodes connected to the zk system
     */
    public List<String> getAliveNodes() throws KattaException {
        // The node names are the children of the configured nodes path.
        return getChildren(_conf.getZKNodesPath());

    /**
     * @return the configuration this client was constructed with; for the
     *         (servers, port, timeout) constructor a default-constructed one
     */
    public ZkConfiguration getConfig() {
        return _conf;

    public static class ZkLock extends ReentrantLock {

        private static final long serialVersionUID = 1L;

        private Condition _dataChangedCondition = newCondition();
        private Condition _stateChangedCondition = newCondition();

         * This condition will be signaled if a zookeeper event was processed and
         * the event contains a data/child change.
        public Condition getDataChangedCondition() {
            return _dataChangedCondition;

         * This condition will be signaled if a zookeeper event was processed and
         * the event contains a state change (connected, disconnected, session
         * expired, etc ...).
        public Condition getStateChangedCondition() {
            return _stateChangedCondition;

